Spaces:
Sleeping
Sleeping
Upload 75 files
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- .streamlit/config.toml +3 -0
- Demo.py +149 -0
- Dockerfile +72 -0
- inputs/opus_mt_cpp_en/Example1.txt +2 -0
- inputs/opus_mt_cpp_en/Example2.txt +2 -0
- inputs/opus_mt_cpp_en/Example3.txt +2 -0
- inputs/opus_mt_cpp_en/Example4.txt +2 -0
- inputs/opus_mt_cpp_en/Example5.txt +2 -0
- inputs/opus_mt_cpp_en/Example6.txt +2 -0
- inputs/opus_mt_cpp_en/Example7.txt +2 -0
- inputs/opus_mt_de_en/Example1.txt +2 -0
- inputs/opus_mt_de_en/Example2.txt +2 -0
- inputs/opus_mt_de_en/Example3.txt +2 -0
- inputs/opus_mt_de_en/Example4.txt +2 -0
- inputs/opus_mt_de_en/Example5.txt +2 -0
- inputs/opus_mt_de_en/Example6.txt +2 -0
- inputs/opus_mt_de_en/Example7.txt +2 -0
- inputs/opus_mt_en_cpp/Example1.txt +2 -0
- inputs/opus_mt_en_cpp/Example2.txt +2 -0
- inputs/opus_mt_en_cpp/Example3.txt +2 -0
- inputs/opus_mt_en_cpp/Example4.txt +2 -0
- inputs/opus_mt_en_cpp/Example5.txt +2 -0
- inputs/opus_mt_en_cpp/Example6.txt +2 -0
- inputs/opus_mt_en_cpp/Example7.txt +2 -0
- inputs/opus_mt_en_de/Example1.txt +2 -0
- inputs/opus_mt_en_de/Example2.txt +2 -0
- inputs/opus_mt_en_de/Example3.txt +2 -0
- inputs/opus_mt_en_de/Example4.txt +2 -0
- inputs/opus_mt_en_de/Example5.txt +2 -0
- inputs/opus_mt_en_de/Example6.txt +2 -0
- inputs/opus_mt_en_de/Example7.txt +2 -0
- inputs/opus_mt_en_es/Example1.txt +2 -0
- inputs/opus_mt_en_es/Example2.txt +2 -0
- inputs/opus_mt_en_es/Example3.txt +2 -0
- inputs/opus_mt_en_es/Example4.txt +2 -0
- inputs/opus_mt_en_es/Example5.txt +2 -0
- inputs/opus_mt_en_es/Example6.txt +2 -0
- inputs/opus_mt_en_es/Example7.txt +2 -0
- inputs/opus_mt_en_fr/Example1.txt +2 -0
- inputs/opus_mt_en_fr/Example2.txt +2 -0
- inputs/opus_mt_en_fr/Example3.txt +2 -0
- inputs/opus_mt_en_fr/Example4.txt +2 -0
- inputs/opus_mt_en_fr/Example5.txt +2 -0
- inputs/opus_mt_en_fr/Example6.txt +2 -0
- inputs/opus_mt_en_fr/Example7.txt +2 -0
- inputs/opus_mt_en_it/Example1.txt +2 -0
- inputs/opus_mt_en_it/Example2.txt +2 -0
- inputs/opus_mt_en_it/Example3.txt +2 -0
- inputs/opus_mt_en_it/Example4.txt +2 -0
- inputs/opus_mt_en_it/Example5.txt +2 -0
.streamlit/config.toml
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
# Streamlit theme settings for the demo app.
[theme]
# Base theme variant the app starts from.
base="light"
# Primary (accent) color, as a hex value.
primaryColor="#29B4E8"
|
Demo.py
ADDED
@@ -0,0 +1,149 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
import streamlit as st
|
2 |
+
import sparknlp
|
3 |
+
import os
|
4 |
+
|
5 |
+
from sparknlp.base import *
|
6 |
+
from sparknlp.common import *
|
7 |
+
from sparknlp.annotator import *
|
8 |
+
from pyspark.ml import Pipeline
|
9 |
+
from sparknlp.pretrained import PretrainedPipeline
|
10 |
+
|
11 |
+
# Page Configuration
|
12 |
+
# Layout options handed to Streamlit before anything else is rendered.
PAGE_OPTIONS = {
    "layout": "wide",
    "initial_sidebar_state": "auto",
}
st.set_page_config(**PAGE_OPTIONS)

# Custom CSS for Styling: the centered page title and the grey rounded
# "section" boxes used for descriptive text.
CUSTOM_CSS = """
<style>
.main-title {
font-size: 36px;
color: #4A90E2;
font-weight: bold;
text-align: center;
}
.section {
background-color: #f9f9f9;
padding: 10px;
border-radius: 10px;
margin-top: 10px;
}
.section p, .section ul {
color: #666666;
}
</style>
"""
st.markdown(CUSTOM_CSS, unsafe_allow_html=True)
|
37 |
+
|
38 |
+
# Initialize Spark NLP
|
39 |
+
@st.cache_resource
def init_spark():
    """Start Spark NLP and return the object produced by ``sparknlp.start()``.

    Decorated with ``st.cache_resource``, presumably so the session is
    created once and reused across Streamlit reruns instead of being
    restarted on every interaction.
    """
    session = sparknlp.start()
    return session
|
42 |
+
|
43 |
+
# Create a Spark NLP Pipeline for MarianTransformer
|
44 |
+
@st.cache_resource
def create_pipeline(model_name):
    """Build the (unfitted) translation pipeline for one Marian model.

    The pipeline has three stages, chained through their column names:
    ``text`` -> ``document`` -> ``sentences`` -> ``translation``.

    Args:
        model_name: Name of the pretrained MarianTransformer model to load,
            e.g. ``"opus_mt_en_fr"``.

    Returns:
        A ``pyspark.ml.Pipeline`` made of a DocumentAssembler, a pretrained
        sentence detector and the pretrained Marian translator.
    """
    document_assembler = (
        DocumentAssembler()
        .setInputCol("text")
        .setOutputCol("document")
    )

    # ``pretrained`` is a loader exposed on the class; call it there rather
    # than on a throwaway instance that is discarded right after.
    sentence_detector = (
        SentenceDetectorDLModel.pretrained("sentence_detector_dl", "xx")
        .setInputCols(["document"])
        .setOutputCol("sentences")
    )

    marian_translator = (
        MarianTransformer.pretrained(model_name, "xx")
        .setInputCols(["sentences"])
        .setOutputCol("translation")
    )

    stages = [document_assembler, sentence_detector, marian_translator]
    return Pipeline(stages=stages)
|
60 |
+
|
61 |
+
# Process the Input Text Through the Pipeline
|
62 |
+
def fit_data(pipeline, text):
    """Run ``text`` through ``pipeline`` and collect the translations.

    Note: this function uses the module-level name ``spark`` (it is not a
    parameter), so that name must be bound before the function is called.

    Args:
        pipeline: Object exposing ``fit(df)`` whose result exposes
            ``transform(df)``.
        text: The text to translate; it becomes the single row of a
            one-column DataFrame named ``text``.

    Returns:
        The collected rows of the ``translation.result`` column.
    """
    frame = spark.createDataFrame([[text]]).toDF("text")
    fitted = pipeline.fit(frame)
    annotated = fitted.transform(frame)
    translated_rows = annotated.select('translation.result').collect()
    return translated_rows
|
66 |
+
|
67 |
+
# Title and Subtitle
|
68 |
+
title = 'Multilingual Text Translation with Spark NLP and MarianMT'
sub_title = """
The MarianTransformer is a powerful, state-of-the-art machine translation model based on the Transformer architecture. Developed by the MarianMT project, this annotator supports over 1,000 translation directions, making it one of the most versatile tools for multilingual natural language processing. Integrated within Spark NLP, the MarianTransformer Annotator allows for scalable and efficient text translation, leveraging the parallel processing capabilities of Apache Spark. Whether you're translating large documents or handling multiple languages simultaneously, this tool ensures high-quality translations with minimal latency.
"""

# Wrap both texts in the CSS classes declared by the page's <style> block
# and render them as raw HTML.
title_html = f'<div class="main-title">{title}</div>'
intro_html = f'<div class="section"><p>{sub_title}</p></div>'
st.markdown(title_html, unsafe_allow_html=True)
st.markdown(intro_html, unsafe_allow_html=True)
|
75 |
+
|
76 |
+
# Mapping Models to Descriptions
|
77 |
+
# Model identifier -> human-readable description shown above the inputs.
model_mappings = {
    "opus_mt_en_fr": "Translate text from English to French",
    "opus_mt_en_it": "Translate text from English to Italian",
    "opus_mt_en_es": "Translate text from English to Spanish",
    "opus_mt_en_de": "Translate text from English to German",
    "opus_mt_en_cpp": "Translate text from English to Portuguese",
    "opus_mt_fr_en": "Translate text from French to English",
    "opus_mt_it_en": "Translate text from Italian to English",
    "opus_mt_es_en": "Translate text from Spanish to English",
    "opus_mt_de_en": "Translate text from German to English",
    "opus_mt_cpp_en": "Translate text from Portuguese to English",
}

# Sidebar for Language Selection
st.sidebar.title("Language Selection")

# Display name -> code fragment used inside the model identifier.
language_mapping = {
    "English": 'en',
    "French": 'fr',
    "Italian": 'it',
    "Spanish": 'es',
    "German": 'de',
    "Portuguese": 'cpp',
}

source_names = list(language_mapping.keys())
from_language = st.sidebar.selectbox("Translate From", source_names)

# Every model in ``model_mappings`` has English on one side, so a non-English
# source can only be translated to English.
target_names = (
    ['French', 'Italian', 'Spanish', 'German', 'Portuguese']
    if from_language == 'English'
    else ['English']
)
to_language = st.sidebar.selectbox("Translate To", target_names)

source_code = language_mapping[from_language]
target_code = language_mapping[to_language]
selected_model = f'opus_mt_{source_code}_{target_code}'
st.subheader(model_mappings[selected_model])
|
111 |
+
|
112 |
+
# Reference Notebook Link in Sidebar
|
113 |
+
# Pieces of the "Open In Colab" badge shown at the bottom of the sidebar.
COLAB_NOTEBOOK_URL = "https://colab.research.google.com/github/JohnSnowLabs/spark-nlp-workshop/blob/master/tutorials/streamlit_notebooks/TRANSLATION_MARIAN.ipynb"
COLAB_BADGE_URL = "https://colab.research.google.com/assets/colab-badge.svg"

link = (
    f'<a href="{COLAB_NOTEBOOK_URL}">'
    f'<img src="{COLAB_BADGE_URL}" style="zoom: 1.3" alt="Open In Colab"/>'
    '</a>'
)

st.sidebar.title('')
st.sidebar.markdown('Reference notebook:')
st.sidebar.markdown(link, unsafe_allow_html=True)
|
117 |
+
|
118 |
+
# Load Sample Text Files
|
119 |
+
def _load_examples(folder):
    """Return the second line of every ``.txt`` file found in ``folder``.

    Each sample file is expected to hold a label on its first line and the
    sample text on its second; files with fewer than two lines are skipped.

    Args:
        folder: Directory to scan (not recursive).

    Returns:
        A list of stripped sample texts ordered by file name, or an empty
        list when ``folder`` does not exist.
    """
    if not os.path.isdir(folder):
        return []

    samples = []
    # Sort so the drop-down order is stable: os.listdir gives no ordering
    # guarantee.
    for filename in sorted(os.listdir(folder)):
        if not filename.endswith('.txt'):
            continue
        # Use a context manager so every file handle is closed promptly.
        with open(os.path.join(folder, filename), 'r', encoding='utf-8') as handle:
            lines = handle.readlines()
        if len(lines) >= 2:
            samples.append(lines[1].strip())
    return samples


folder_path = f"inputs/{selected_model}"
examples = _load_examples(folder_path)

selected_text = st.selectbox("Select a Sample Text", examples)
custom_input = st.text_input("Try it for yourself!")

# Text typed by the user takes precedence over the chosen sample.
if custom_input:
    selected_text = custom_input

# With no samples and no custom input there is nothing to translate; stop
# this run instead of handing an empty value to Spark.
if not selected_text:
    st.warning("No sample text is available for this model. Please enter your own text.")
    st.stop()

# Display the Selected or Entered Text
st.subheader('Selected Text')
st.write(selected_text)
|
137 |
+
|
138 |
+
# Perform Translation and Display the Result
|
139 |
+
import html

st.subheader("Translation Result")

spark = init_spark()
pipeline = create_pipeline(selected_model)
output = fit_data(pipeline, selected_text)

# ``output[0][0]`` holds one translated string per detected sentence; join
# them with a space so consecutive sentences do not run together.
res = " ".join(output[0][0])
HTML_WRAPPER = """<div class="scroll entities" style="overflow-x: auto; border: 1px solid #e6e9ef; border-radius: 0.25rem; padding: 1rem; margin-bottom: 2.5rem; white-space:pre-wrap">{}</div>"""
# The translation is derived from user-supplied text and is injected into raw
# HTML below, so escape it to keep any markup from being interpreted.
st.markdown(HTML_WRAPPER.format(html.escape(res, quote=False)), unsafe_allow_html=True)
|
148 |
+
|
149 |
+
|
Dockerfile
ADDED
@@ -0,0 +1,72 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
# Download base image ubuntu 18.04
FROM ubuntu:18.04

# Set environment variables (key=value form; the space-separated form is legacy)
ENV NB_USER=jovyan
ENV NB_UID=1000
ENV HOME=/home/${NB_USER}
ENV JAVA_HOME=/usr/lib/jvm/java-8-openjdk-amd64/

# Install required packages.
# DEBIAN_FRONTEND=noninteractive keeps package configuration from prompting
# during the build; the apt lists are removed to keep the layer small.
RUN apt-get update && DEBIAN_FRONTEND=noninteractive apt-get install -y \
    tar \
    wget \
    bash \
    rsync \
    gcc \
    libfreetype6-dev \
    libhdf5-serial-dev \
    libpng-dev \
    libzmq3-dev \
    python3 \
    python3-dev \
    python3-pip \
    unzip \
    pkg-config \
    software-properties-common \
    graphviz \
    openjdk-8-jdk \
    ant \
    ca-certificates-java \
    && apt-get clean \
    && rm -rf /var/lib/apt/lists/* \
    && update-ca-certificates -f

# Install Python 3.8 and pip
RUN add-apt-repository -y ppa:deadsnakes/ppa \
    && apt-get update \
    && DEBIAN_FRONTEND=noninteractive apt-get install -y python3.8 python3-pip \
    && apt-get clean \
    && rm -rf /var/lib/apt/lists/*

# Set up JAVA_HOME
RUN echo "export JAVA_HOME=/usr/lib/jvm/java-8-openjdk-amd64/" >> /etc/profile \
    && echo "export PATH=\$JAVA_HOME/bin:\$PATH" >> /etc/profile

# Create a new user named "jovyan" with user ID 1000
RUN useradd -m -u ${NB_UID} ${NB_USER}

# Switch to the "jovyan" user
USER ${NB_USER}

# Set home and path variables for the user
ENV HOME=/home/${NB_USER} \
    PATH=/home/${NB_USER}/.local/bin:$PATH

# Set up PySpark to use Python 3.8 for both driver and workers
ENV PYSPARK_PYTHON=/usr/bin/python3.8
ENV PYSPARK_DRIVER_PYTHON=/usr/bin/python3.8

# Set the working directory to the user's home directory
WORKDIR ${HOME}

# Upgrade pip and install Python dependencies
RUN python3.8 -m pip install --upgrade pip
COPY requirements.txt /tmp/requirements.txt
RUN python3.8 -m pip install -r /tmp/requirements.txt

# Copy the application code into the container at /home/jovyan
COPY --chown=${NB_USER}:${NB_USER} . ${HOME}

# Expose port for Streamlit
EXPOSE 7860

# Define the entry point for the container
ENTRYPOINT ["streamlit", "run", "Demo.py", "--server.port=7860", "--server.address=0.0.0.0"]
|
inputs/opus_mt_cpp_en/Example1.txt
ADDED
@@ -0,0 +1,2 @@
|
|
|
|
|
|
|
1 |
+
Example1.txt
|
2 |
+
Além de ser o rei do norte, John Snow é um médico inglês e líder no desenvolvimento de anestesia e higiene médica. Ele é considerado o primeiro a usar dados para curar surto de cólera em 1854.
|
inputs/opus_mt_cpp_en/Example2.txt
ADDED
@@ -0,0 +1,2 @@
|
|
|
|
|
|
|
1 |
+
Example2.txt
|
2 |
+
Titanic é um romance épico americano de 1997, um filme de desastre dirigido, escrito, co-produzido e co-editado por James Cameron. Incorporando aspectos históricos e ficcionalizados, é baseado em relatos do naufrágio do RMS Titanic. É estrelado por Leonardo DiCaprio e Kate Winslet como membros de diferentes classes sociais que se apaixonam a bordo do navio durante sua viagem inaugural malfadada.
|
inputs/opus_mt_cpp_en/Example3.txt
ADDED
@@ -0,0 +1,2 @@
|
|
|
|
|
|
|
1 |
+
Example3.txt
|
2 |
+
William Henry Gates III (nascido em 28 de outubro de 1955) é um magnata dos negócios, desenvolvedor de software, investidor e filantropo americano. Ele é mais conhecido como o co-fundador da Microsoft Corporation. Durante sua carreira na Microsoft, Gates ocupou os cargos de presidente do conselho, diretor executivo (CEO), presidente e arquiteto-chefe de software. Ele também foi o maior acionista individual até maio de 2014. É um dos mais conhecidos empreendedores e pioneiros da revolução do microcomputador das décadas de 1970 e 1980.
|
inputs/opus_mt_cpp_en/Example4.txt
ADDED
@@ -0,0 +1,2 @@
|
|
|
|
|
|
|
1 |
+
Example4.txt
|
2 |
+
A Mona Lisa é uma pintura a óleo do século 16 criada por Leonardo. É realizado no Louvre, em Paris.
|
inputs/opus_mt_cpp_en/Example5.txt
ADDED
@@ -0,0 +1,2 @@
|
|
|
|
|
|
|
1 |
+
Example5.txt
|
2 |
+
O Facebook é um serviço de rede social lançado como TheFacebook em 4 de fevereiro de 2004. Foi fundado por Mark Zuckerberg com seus colegas de faculdade e colegas da Universidade de Harvard Eduardo Saverin, Andrew McCollum, Dustin Moskovitz e Chris Hughes. A associação do site foi inicialmente limitada pelos fundadores aos alunos de Harvard, mas foi expandida para outras faculdades na área de Boston, a Ivy League e, gradualmente, a maioria das universidades nos Estados Unidos e Canadá.
|
inputs/opus_mt_cpp_en/Example6.txt
ADDED
@@ -0,0 +1,2 @@
|
|
|
|
|
|
|
1 |
+
Example6.txt
|
2 |
+
Geoffrey Everest Hinton é um psicólogo cognitivo e cientista da computação canadense inglês, mais conhecido por seu trabalho em redes neurais artificiais. Desde 2013, ele divide seu tempo trabalhando para o Google e a Universidade de Toronto. Em 2017, ele foi cofundador e se tornou o assessor científico-chefe do Vector Institute em Toronto.
|
inputs/opus_mt_cpp_en/Example7.txt
ADDED
@@ -0,0 +1,2 @@
|
|
|
|
|
|
|
1 |
+
Example7.txt
|
2 |
+
Quando eu disse a John que queria me mudar para o Alasca, ele me avisou que teria problemas para encontrar um Starbucks lá.
|
inputs/opus_mt_de_en/Example1.txt
ADDED
@@ -0,0 +1,2 @@
|
|
|
|
|
|
|
1 |
+
Example1.txt
|
2 |
+
John Snow ist ein englischer Arzt und ein Führer in der Entwicklung der Anästhesie des Nordens.. Er ist der erste, der Daten verwendet, um Choleraausbruch 1854 zu heilen.
|
inputs/opus_mt_de_en/Example2.txt
ADDED
@@ -0,0 +1,2 @@
|
|
|
|
|
|
|
1 |
+
Example2.txt
|
2 |
+
Titanic ist ein US-amerikanischer Film von James Cameron.. Sie umfasst sowohl historische als auch fiktionalisierte Aspekte, basiert auf Konten der Versenken der RMS Titanic.. Es spielt Leonardo DiCaprio und Kate Winslet als Mitglieder der verschiedenen sozialen Klassen. Sie verliebt sich in das Schiff während seiner unglückselige Mädchen.
|
inputs/opus_mt_de_en/Example3.txt
ADDED
@@ -0,0 +1,2 @@
|
|
|
|
|
|
|
1 |
+
Example3.txt
|
2 |
+
Oktober 1955 in New York City) ist ein US-amerikanischer Software-Entwickler, Investor und Philanthrop.. Während seiner Karriere bei Microsoft, Gates war die Positionen von Vorsitzender, Chief Executive Officer (CEO), Präsident und Chef Software Architekt.. Bis Mai 2014 war er der größte Einzelaktionär.. Er ist einer der bekanntesten Unternehmer und Pioniere der Mikrocomputerrevolution der 1970er und 1980er Jahre.
|
inputs/opus_mt_de_en/Example4.txt
ADDED
@@ -0,0 +1,2 @@
|
|
|
|
|
|
|
1 |
+
Example4.txt
|
2 |
+
Die Mona Lisa ist ein Ölgemälde aus dem 16.. Es wird im Louvre in Paris gehalten.
|
inputs/opus_mt_de_en/Example5.txt
ADDED
@@ -0,0 +1,2 @@
|
|
|
|
|
|
|
1 |
+
Example5.txt
|
2 |
+
Facebook ist ein Social Network Service am 4. Februar 2004.. Es wurde von Mark Zuckerberg mit seinen College-Mitbewohnern und anderen Harvard-Universitätsstudenten Eduardo Saverin, Andrew McCollum, Dustin Moskovitz gegründet.. Die Mitgliedschaft der Website wurde zunächst von Harvard Studenten, aber auch auf andere Hochschulen in der Boston, die Ivy League und allmählich die meisten Universitäten in den Vereinigten Staaten
|
inputs/opus_mt_de_en/Example6.txt
ADDED
@@ -0,0 +1,2 @@
|
|
|
|
|
|
|
1 |
+
Example6.txt
|
2 |
+
Geoffrey Everest Hinton ist ein kanadischer Psychologe und Computer.. Seit 2013 arbeitet er für Google und die University of Toronto.. 2017 wurde er wissenschaftlicher Berater des Vector Institute in Toronto.
|
inputs/opus_mt_de_en/Example7.txt
ADDED
@@ -0,0 +1,2 @@
|
|
|
|
|
|
|
1 |
+
Example7.txt
|
2 |
+
Als ich John sagte, dass ich nach Alaska ziehen wollte, dass ich Probleme hatte, dass ich ein Starbucks dort haben würde, er mich, dass ich hatte, dass ich hatte, dass ich
|
inputs/opus_mt_en_cpp/Example1.txt
ADDED
@@ -0,0 +1,2 @@
|
|
|
|
|
|
|
1 |
+
Example1.txt
|
2 |
+
Other than being the king of the north, John Snow is an English physician and a leader in the development of anaesthesia and medical hygiene. He is considered the first to use data to cure a cholera outbreak in 1854.
|
inputs/opus_mt_en_cpp/Example2.txt
ADDED
@@ -0,0 +1,2 @@
|
|
|
|
|
|
|
1 |
+
Example2.txt
|
2 |
+
Titanic is a 1997 American epic romance and disaster film directed, written, co-produced, and co-edited by James Cameron. Incorporating both historical and fictionalized aspects, it is based on accounts of the sinking of the RMS Titanic. It stars Leonardo DiCaprio and Kate Winslet as members of different social classes who fall in love aboard the ship during its ill-fated maiden voyage.
|
inputs/opus_mt_en_cpp/Example3.txt
ADDED
@@ -0,0 +1,2 @@
|
|
|
|
|
|
|
1 |
+
Example3.txt
|
2 |
+
William Henry Gates III (born October 28, 1955) is an American business magnate, software developer, investor, and philanthropist. He is best known as the co-founder of Microsoft Corporation. During his career at Microsoft, Gates held the positions of chairman, chief executive officer (CEO), president and chief software architect. He was also the largest individual shareholder until May 2014. He is one of the best-known entrepreneurs and pioneers of the microcomputer revolution of the 1970s and 1980s.
|
inputs/opus_mt_en_cpp/Example4.txt
ADDED
@@ -0,0 +1,2 @@
|
|
|
|
|
|
|
1 |
+
Example4.txt
|
2 |
+
The Mona Lisa is a 16th century oil painting created by Leonardo. It's held at the Louvre in Paris.
|
inputs/opus_mt_en_cpp/Example5.txt
ADDED
@@ -0,0 +1,2 @@
|
|
|
|
|
|
|
1 |
+
Example5.txt
|
2 |
+
Facebook is a social networking service launched as TheFacebook on February 4, 2004. It was founded by Mark Zuckerberg with his college roommates and fellow Harvard University students Eduardo Saverin, Andrew McCollum, Dustin Moskovitz and Chris Hughes. The website's membership was initially limited by the founders to Harvard students, but was expanded to other colleges in the Boston area, the Ivy League, and gradually most universities in the United States and Canada.
|
inputs/opus_mt_en_cpp/Example6.txt
ADDED
@@ -0,0 +1,2 @@
|
|
|
|
|
|
|
1 |
+
Example6.txt
|
2 |
+
Geoffrey Everest Hinton is an English Canadian cognitive psychologist and computer scientist, most noted for his work on artificial neural networks. Since 2013 he divides his time working for Google and the University of Toronto. In 2017, he cofounded and became the Chief Scientific Advisor of the Vector Institute in Toronto.
|
inputs/opus_mt_en_cpp/Example7.txt
ADDED
@@ -0,0 +1,2 @@
|
|
|
|
|
|
|
1 |
+
Example7.txt
|
2 |
+
When I told John that I wanted to move to Alaska, he warned me that I'd have trouble finding a Starbucks there.
|
inputs/opus_mt_en_de/Example1.txt
ADDED
@@ -0,0 +1,2 @@
|
|
|
|
|
|
|
1 |
+
Example1.txt
|
2 |
+
Other than being the king of the north, John Snow is an English physician and a leader in the development of anaesthesia and medical hygiene. He is considered the first to use data to cure a cholera outbreak in 1854.
|
inputs/opus_mt_en_de/Example2.txt
ADDED
@@ -0,0 +1,2 @@
|
|
|
|
|
|
|
1 |
+
Example2.txt
|
2 |
+
Titanic is a 1997 American epic romance and disaster film directed, written, co-produced, and co-edited by James Cameron. Incorporating both historical and fictionalized aspects, it is based on accounts of the sinking of the RMS Titanic. It stars Leonardo DiCaprio and Kate Winslet as members of different social classes who fall in love aboard the ship during its ill-fated maiden voyage.
|
inputs/opus_mt_en_de/Example3.txt
ADDED
@@ -0,0 +1,2 @@
|
|
|
|
|
|
|
1 |
+
Example3.txt
|
2 |
+
William Henry Gates III (born October 28, 1955) is an American business magnate, software developer, investor, and philanthropist. He is best known as the co-founder of Microsoft Corporation. During his career at Microsoft, Gates held the positions of chairman, chief executive officer (CEO), president and chief software architect. He was also the largest individual shareholder until May 2014. He is one of the best-known entrepreneurs and pioneers of the microcomputer revolution of the 1970s and 1980s.
|
inputs/opus_mt_en_de/Example4.txt
ADDED
@@ -0,0 +1,2 @@
|
|
|
|
|
|
|
1 |
+
Example4.txt
|
2 |
+
The Mona Lisa is a 16th century oil painting created by Leonardo. It's held at the Louvre in Paris.
|
inputs/opus_mt_en_de/Example5.txt
ADDED
@@ -0,0 +1,2 @@
|
|
|
|
|
|
|
1 |
+
Example5.txt
|
2 |
+
Facebook is a social networking service launched as TheFacebook on February 4, 2004. It was founded by Mark Zuckerberg with his college roommates and fellow Harvard University students Eduardo Saverin, Andrew McCollum, Dustin Moskovitz and Chris Hughes. The website's membership was initially limited by the founders to Harvard students, but was expanded to other colleges in the Boston area, the Ivy League, and gradually most universities in the United States and Canada.
|
inputs/opus_mt_en_de/Example6.txt
ADDED
@@ -0,0 +1,2 @@
|
|
|
|
|
|
|
1 |
+
Example6.txt
|
2 |
+
Geoffrey Everest Hinton is an English Canadian cognitive psychologist and computer scientist, most noted for his work on artificial neural networks. Since 2013 he divides his time working for Google and the University of Toronto. In 2017, he cofounded and became the Chief Scientific Advisor of the Vector Institute in Toronto.
|
inputs/opus_mt_en_de/Example7.txt
ADDED
@@ -0,0 +1,2 @@
|
|
|
|
|
|
|
1 |
+
Example7.txt
|
2 |
+
When I told John that I wanted to move to Alaska, he warned me that I'd have trouble finding a Starbucks there.
|
inputs/opus_mt_en_es/Example1.txt
ADDED
@@ -0,0 +1,2 @@
|
|
|
|
|
|
|
1 |
+
Example1.txt
|
2 |
+
Other than being the king of the north, John Snow is an English physician and a leader in the development of anaesthesia and medical hygiene. He is considered the first to use data to cure a cholera outbreak in 1854.
|
inputs/opus_mt_en_es/Example2.txt
ADDED
@@ -0,0 +1,2 @@
|
|
|
|
|
|
|
1 |
+
Example2.txt
|
2 |
+
Titanic is a 1997 American epic romance and disaster film directed, written, co-produced, and co-edited by James Cameron. Incorporating both historical and fictionalized aspects, it is based on accounts of the sinking of the RMS Titanic. It stars Leonardo DiCaprio and Kate Winslet as members of different social classes who fall in love aboard the ship during its ill-fated maiden voyage.
|
inputs/opus_mt_en_es/Example3.txt
ADDED
@@ -0,0 +1,2 @@
|
|
|
|
|
|
|
1 |
+
Example3.txt
|
2 |
+
William Henry Gates III (born October 28, 1955) is an American business magnate, software developer, investor, and philanthropist. He is best known as the co-founder of Microsoft Corporation. During his career at Microsoft, Gates held the positions of chairman, chief executive officer (CEO), president and chief software architect. He was also the largest individual shareholder until May 2014. He is one of the best-known entrepreneurs and pioneers of the microcomputer revolution of the 1970s and 1980s.
|
inputs/opus_mt_en_es/Example4.txt
ADDED
@@ -0,0 +1,2 @@
|
|
|
|
|
|
|
1 |
+
Example4.txt
|
2 |
+
The Mona Lisa is a 16th century oil painting created by Leonardo. It's held at the Louvre in Paris.
|
inputs/opus_mt_en_es/Example5.txt
ADDED
@@ -0,0 +1,2 @@
|
|
|
|
|
|
|
1 |
+
Example5.txt
|
2 |
+
Facebook is a social networking service launched as TheFacebook on February 4, 2004. It was founded by Mark Zuckerberg with his college roommates and fellow Harvard University students Eduardo Saverin, Andrew McCollum, Dustin Moskovitz and Chris Hughes. The website's membership was initially limited by the founders to Harvard students, but was expanded to other colleges in the Boston area, the Ivy League, and gradually most universities in the United States and Canada.
|
inputs/opus_mt_en_es/Example6.txt
ADDED
@@ -0,0 +1,2 @@
|
|
|
|
|
|
|
1 |
+
Example6.txt
|
2 |
+
Geoffrey Everest Hinton is an English Canadian cognitive psychologist and computer scientist, most noted for his work on artificial neural networks. Since 2013 he divides his time working for Google and the University of Toronto. In 2017, he cofounded and became the Chief Scientific Advisor of the Vector Institute in Toronto.
|
inputs/opus_mt_en_es/Example7.txt
ADDED
@@ -0,0 +1,2 @@
|
|
|
|
|
|
|
1 |
+
Example7.txt
|
2 |
+
When I told John that I wanted to move to Alaska, he warned me that I'd have trouble finding a Starbucks there.
|
inputs/opus_mt_en_fr/Example1.txt
ADDED
@@ -0,0 +1,2 @@
|
|
|
|
|
|
|
1 |
+
Example1.txt
|
2 |
+
Other than being the king of the north, John Snow is an English physician and a leader in the development of anaesthesia and medical hygiene. He is considered the first to use data to cure a cholera outbreak in 1854.
|
inputs/opus_mt_en_fr/Example2.txt
ADDED
@@ -0,0 +1,2 @@
|
|
|
|
|
|
|
1 |
+
Example2.txt
|
2 |
+
Titanic is a 1997 American epic romance and disaster film directed, written, co-produced, and co-edited by James Cameron. Incorporating both historical and fictionalized aspects, it is based on accounts of the sinking of the RMS Titanic. It stars Leonardo DiCaprio and Kate Winslet as members of different social classes who fall in love aboard the ship during its ill-fated maiden voyage.
|
inputs/opus_mt_en_fr/Example3.txt
ADDED
@@ -0,0 +1,2 @@
|
|
|
|
|
|
|
1 |
+
Example3.txt
|
2 |
+
William Henry Gates III (born October 28, 1955) is an American business magnate, software developer, investor, and philanthropist. He is best known as the co-founder of Microsoft Corporation. During his career at Microsoft, Gates held the positions of chairman, chief executive officer (CEO), president and chief software architect. He was also the largest individual shareholder until May 2014. He is one of the best-known entrepreneurs and pioneers of the microcomputer revolution of the 1970s and 1980s.
|
inputs/opus_mt_en_fr/Example4.txt
ADDED
@@ -0,0 +1,2 @@
|
|
|
|
|
|
|
1 |
+
Example4.txt
|
2 |
+
The Mona Lisa is a 16th century oil painting created by Leonardo. It's held at the Louvre in Paris.
|
inputs/opus_mt_en_fr/Example5.txt
ADDED
@@ -0,0 +1,2 @@
|
|
|
|
|
|
|
1 |
+
Example5.txt
|
2 |
+
Facebook is a social networking service launched as TheFacebook on February 4, 2004. It was founded by Mark Zuckerberg with his college roommates and fellow Harvard University students Eduardo Saverin, Andrew McCollum, Dustin Moskovitz and Chris Hughes. The website's membership was initially limited by the founders to Harvard students, but was expanded to other colleges in the Boston area, the Ivy League, and gradually most universities in the United States and Canada.
|
inputs/opus_mt_en_fr/Example6.txt
ADDED
@@ -0,0 +1,2 @@
|
|
|
|
|
|
|
1 |
+
Example6.txt
|
2 |
+
Geoffrey Everest Hinton is an English Canadian cognitive psychologist and computer scientist, most noted for his work on artificial neural networks. Since 2013 he divides his time working for Google and the University of Toronto. In 2017, he cofounded and became the Chief Scientific Advisor of the Vector Institute in Toronto.
|
inputs/opus_mt_en_fr/Example7.txt
ADDED
@@ -0,0 +1,2 @@
|
|
|
|
|
|
|
1 |
+
Example7.txt
|
2 |
+
When I told John that I wanted to move to Alaska, he warned me that I'd have trouble finding a Starbucks there.
|
inputs/opus_mt_en_it/Example1.txt
ADDED
@@ -0,0 +1,2 @@
|
|
|
|
|
|
|
1 |
+
Example1.txt
|
2 |
+
Other than being the king of the north, John Snow is an English physician and a leader in the development of anaesthesia and medical hygiene. He is considered the first to use data to cure a cholera outbreak in 1854.
|
inputs/opus_mt_en_it/Example2.txt
ADDED
@@ -0,0 +1,2 @@
|
|
|
|
|
|
|
1 |
+
Example2.txt
|
2 |
+
Titanic is a 1997 American epic romance and disaster film directed, written, co-produced, and co-edited by James Cameron. Incorporating both historical and fictionalized aspects, it is based on accounts of the sinking of the RMS Titanic. It stars Leonardo DiCaprio and Kate Winslet as members of different social classes who fall in love aboard the ship during its ill-fated maiden voyage.
|
inputs/opus_mt_en_it/Example3.txt
ADDED
@@ -0,0 +1,2 @@
|
|
|
|
|
|
|
1 |
+
Example3.txt
|
2 |
+
William Henry Gates III (born October 28, 1955) is an American business magnate, software developer, investor, and philanthropist. He is best known as the co-founder of Microsoft Corporation. During his career at Microsoft, Gates held the positions of chairman, chief executive officer (CEO), president and chief software architect. He was also the largest individual shareholder until May 2014. He is one of the best-known entrepreneurs and pioneers of the microcomputer revolution of the 1970s and 1980s.
|
inputs/opus_mt_en_it/Example4.txt
ADDED
@@ -0,0 +1,2 @@
|
|
|
|
|
|
|
1 |
+
Example4.txt
|
2 |
+
The Mona Lisa is a 16th century oil painting created by Leonardo. It's held at the Louvre in Paris.
|
inputs/opus_mt_en_it/Example5.txt
ADDED
@@ -0,0 +1,2 @@
|
|
|
|
|
|
|
1 |
+
Example5.txt
|
2 |
+
Facebook is a social networking service launched as TheFacebook on February 4, 2004. It was founded by Mark Zuckerberg with his college roommates and fellow Harvard University students Eduardo Saverin, Andrew McCollum, Dustin Moskovitz and Chris Hughes. The website's membership was initially limited by the founders to Harvard students, but was expanded to other colleges in the Boston area, the Ivy League, and gradually most universities in the United States and Canada.
|