% Conference paper by Killer, Sennrich and Volk in the GSCL 2011 proceedings, pp. 57--62.
% Personal names use the unambiguous "Last, First" form; the acronym in
% booktitle is brace-protected so that recasing styles keep its capitals.
% NOTE(review): editor given names are only available as initials here --
% expand to full names if the proceedings front matter is at hand.
@inproceedings{9366091f29934b4784dd066f1d809bb8,
  author    = {Killer, Markus and Sennrich, Rico and Volk, Martin},
  title     = {From multilingual web-archives to parallel treebanks in five minutes},
  booktitle = {Conference of the German Society for Computational Linguistics and Language Technology ({GSCL}) 2011},
  editor    = {Hedeland, H. and Schmidt, T. and W{\"o}rner, K.},
  series    = {Arbeiten zur Mehrsprachigkeit - Folge B},
  publisher = {Universit{\"a}t Hamburg},
  pages     = {57--62},
  year      = {2011},
  month     = sep,
  day       = {1},
  language  = {English},
  keywords  = {parallel treebank, automatic tree-to-tree alignment, TreeAligner, Text-und-Berg},
  abstract  = {The Tree-to-Tree (t2t) Alignment Pipe is a collection of Python scripts, generating automatically aligned parallel treebanks from multilingual web resources or existing parallel corpora. The pipe contains wrappers for a number of freely available NLP software programs. Once these third party programs have been installed and the system and corpus specific details have been updated, the pipe is designed to generate a parallel treebank with a single program call from a unix command line. We discuss alignment quality on a fully automatically processed parallel corpus.},
  note      = {Conference of the German Society for Computational Linguistics and Language Technology (GSCL) 2011 ; Conference date: 28-09-2011 Through 30-09-2011},
}