abdullahmubeen10 committed on
Commit
8d64fe0
·
verified ·
1 Parent(s): 445b449

Upload 75 files

Browse files
This view is limited to 50 files because it contains too many changes.   See raw diff
Files changed (50) hide show
  1. .streamlit/config.toml +3 -0
  2. Demo.py +149 -0
  3. Dockerfile +72 -0
  4. inputs/opus_mt_cpp_en/Example1.txt +2 -0
  5. inputs/opus_mt_cpp_en/Example2.txt +2 -0
  6. inputs/opus_mt_cpp_en/Example3.txt +2 -0
  7. inputs/opus_mt_cpp_en/Example4.txt +2 -0
  8. inputs/opus_mt_cpp_en/Example5.txt +2 -0
  9. inputs/opus_mt_cpp_en/Example6.txt +2 -0
  10. inputs/opus_mt_cpp_en/Example7.txt +2 -0
  11. inputs/opus_mt_de_en/Example1.txt +2 -0
  12. inputs/opus_mt_de_en/Example2.txt +2 -0
  13. inputs/opus_mt_de_en/Example3.txt +2 -0
  14. inputs/opus_mt_de_en/Example4.txt +2 -0
  15. inputs/opus_mt_de_en/Example5.txt +2 -0
  16. inputs/opus_mt_de_en/Example6.txt +2 -0
  17. inputs/opus_mt_de_en/Example7.txt +2 -0
  18. inputs/opus_mt_en_cpp/Example1.txt +2 -0
  19. inputs/opus_mt_en_cpp/Example2.txt +2 -0
  20. inputs/opus_mt_en_cpp/Example3.txt +2 -0
  21. inputs/opus_mt_en_cpp/Example4.txt +2 -0
  22. inputs/opus_mt_en_cpp/Example5.txt +2 -0
  23. inputs/opus_mt_en_cpp/Example6.txt +2 -0
  24. inputs/opus_mt_en_cpp/Example7.txt +2 -0
  25. inputs/opus_mt_en_de/Example1.txt +2 -0
  26. inputs/opus_mt_en_de/Example2.txt +2 -0
  27. inputs/opus_mt_en_de/Example3.txt +2 -0
  28. inputs/opus_mt_en_de/Example4.txt +2 -0
  29. inputs/opus_mt_en_de/Example5.txt +2 -0
  30. inputs/opus_mt_en_de/Example6.txt +2 -0
  31. inputs/opus_mt_en_de/Example7.txt +2 -0
  32. inputs/opus_mt_en_es/Example1.txt +2 -0
  33. inputs/opus_mt_en_es/Example2.txt +2 -0
  34. inputs/opus_mt_en_es/Example3.txt +2 -0
  35. inputs/opus_mt_en_es/Example4.txt +2 -0
  36. inputs/opus_mt_en_es/Example5.txt +2 -0
  37. inputs/opus_mt_en_es/Example6.txt +2 -0
  38. inputs/opus_mt_en_es/Example7.txt +2 -0
  39. inputs/opus_mt_en_fr/Example1.txt +2 -0
  40. inputs/opus_mt_en_fr/Example2.txt +2 -0
  41. inputs/opus_mt_en_fr/Example3.txt +2 -0
  42. inputs/opus_mt_en_fr/Example4.txt +2 -0
  43. inputs/opus_mt_en_fr/Example5.txt +2 -0
  44. inputs/opus_mt_en_fr/Example6.txt +2 -0
  45. inputs/opus_mt_en_fr/Example7.txt +2 -0
  46. inputs/opus_mt_en_it/Example1.txt +2 -0
  47. inputs/opus_mt_en_it/Example2.txt +2 -0
  48. inputs/opus_mt_en_it/Example3.txt +2 -0
  49. inputs/opus_mt_en_it/Example4.txt +2 -0
  50. inputs/opus_mt_en_it/Example5.txt +2 -0
.streamlit/config.toml ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ [theme]
2
+ base="light"
3
+ primaryColor="#29B4E8"
Demo.py ADDED
@@ -0,0 +1,149 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ import streamlit as st
2
+ import sparknlp
3
+ import os
4
+
5
+ from sparknlp.base import *
6
+ from sparknlp.common import *
7
+ from sparknlp.annotator import *
8
+ from pyspark.ml import Pipeline
9
+ from sparknlp.pretrained import PretrainedPipeline
10
+
11
# Page configuration (must be issued before any other Streamlit output).
st.set_page_config(layout="wide", initial_sidebar_state="auto")

# Stylesheet for the title banner (.main-title) and the grey description
# panels (.section) rendered further down the page.
_PAGE_CSS = """
<style>
.main-title {
font-size: 36px;
color: #4A90E2;
font-weight: bold;
text-align: center;
}
.section {
background-color: #f9f9f9;
padding: 10px;
border-radius: 10px;
margin-top: 10px;
}
.section p, .section ul {
color: #666666;
}
</style>
"""
st.markdown(_PAGE_CSS, unsafe_allow_html=True)
37
+
38
# Initialize Spark NLP
@st.cache_resource
def init_spark():
    """Start Spark NLP and return whatever ``sparknlp.start()`` returns.

    Decorated with ``st.cache_resource`` so the started session is reused
    instead of being created again on every call.
    """
    session = sparknlp.start()
    return session
42
+
43
# Create a Spark NLP Pipeline for MarianTransformer
@st.cache_resource
def create_pipeline(model_name):
    """Build the (unfitted) translation pipeline for one MarianMT model.

    Args:
        model_name: Name of the pretrained MarianTransformer model to load,
            e.g. ``"opus_mt_en_fr"``.

    Returns:
        A ``pyspark.ml.Pipeline`` with three stages, in order:
        DocumentAssembler ("text" -> "document"),
        SentenceDetectorDLModel ("document" -> "sentences"),
        MarianTransformer ("sentences" -> "translation").
    """
    document_assembler = (
        DocumentAssembler()
        .setInputCol("text")
        .setOutputCol("document")
    )

    # ``pretrained`` is invoked on the class, exactly like MarianTransformer
    # below; constructing an empty model first only to discard it is wasted
    # work and made the two loaders look inconsistent.
    sentence_detector = (
        SentenceDetectorDLModel.pretrained("sentence_detector_dl", "xx")
        .setInputCols(["document"])
        .setOutputCol("sentences")
    )

    marian_translator = (
        MarianTransformer.pretrained(model_name, "xx")
        .setInputCols(["sentences"])
        .setOutputCol("translation")
    )

    return Pipeline(stages=[document_assembler, sentence_detector, marian_translator])
60
+
61
# Process the Input Text Through the Pipeline
def fit_data(pipeline, text):
    """Run *text* through *pipeline* and collect the translated sentences.

    Args:
        pipeline: The pipeline returned by ``create_pipeline``.
        text: The string to translate.

    Returns:
        The collected rows of the ``translation.result`` column; there is one
        row because the input DataFrame has exactly one row.
    """
    # Fetch the cached session here rather than relying on a module-level
    # ``spark`` variable that is only assigned much later in the script.
    session = init_spark()
    data = session.createDataFrame([[text]]).toDF("text")
    result = pipeline.fit(data).transform(data)
    return result.select('translation.result').collect()
66
+
67
# Title and Subtitle
title = 'Multilingual Text Translation with Spark NLP and MarianMT'
sub_title = """
The MarianTransformer is a powerful, state-of-the-art machine translation model based on the Transformer architecture. Developed by the MarianMT project, this annotator supports over 1,000 translation directions, making it one of the most versatile tools for multilingual natural language processing. Integrated within Spark NLP, the MarianTransformer Annotator allows for scalable and efficient text translation, leveraging the parallel processing capabilities of Apache Spark. Whether you're translating large documents or handling multiple languages simultaneously, this tool ensures high-quality translations with minimal latency.
"""

# Wrap both texts in the CSS classes defined by the page stylesheet, then
# render the banner first and the description panel second.
_title_html = f'<div class="main-title">{title}</div>'
_intro_html = f'<div class="section"><p>{sub_title}</p></div>'
st.markdown(_title_html, unsafe_allow_html=True)
st.markdown(_intro_html, unsafe_allow_html=True)
75
+
76
# Mapping Models to Descriptions
# (model-name code, display name) for each language that is paired with
# English, listed in the order the entries should appear in the mapping.
_PARTNER_LANGUAGES = (
    ("fr", "French"),
    ("it", "Italian"),
    ("es", "Spanish"),
    ("de", "German"),
    ("cpp", "Portuguese"),
)

# English -> X entries first, then X -> English, keyed by model name.
model_mappings = {
    **{
        f"opus_mt_en_{code}": f"Translate text from English to {name}"
        for code, name in _PARTNER_LANGUAGES
    },
    **{
        f"opus_mt_{code}_en": f"Translate text from {name} to English"
        for code, name in _PARTNER_LANGUAGES
    },
}
89
+
90
# Sidebar for Language Selection
st.sidebar.title("Language Selection")

# Display name -> code used inside the model names.
language_mapping = {
    "English": 'en',
    "French": 'fr',
    "Italian": 'it',
    "Spanish": 'es',
    "German": 'de',
    "Portuguese": 'cpp',
}

from_language = st.sidebar.selectbox("Translate From", list(language_mapping))

# English can be translated into any of the other languages; every other
# source language can only be translated into English.
if from_language == 'English':
    target_choices = [name for name in language_mapping if name != 'English']
else:
    target_choices = ['English']
to_language = st.sidebar.selectbox("Translate To", target_choices)

# Assemble the model name from the two codes and show its description.
source_code = language_mapping[from_language]
target_code = language_mapping[to_language]
selected_model = f'opus_mt_{source_code}_{target_code}'
st.subheader(model_mappings[selected_model])
111
+
112
# Reference Notebook Link in Sidebar
_NOTEBOOK_URL = "https://colab.research.google.com/github/JohnSnowLabs/spark-nlp-workshop/blob/master/tutorials/streamlit_notebooks/TRANSLATION_MARIAN.ipynb"
_BADGE_URL = "https://colab.research.google.com/assets/colab-badge.svg"

# Badge image wrapped in an anchor that points at the notebook.
link = f'<a href="{_NOTEBOOK_URL}"><img src="{_BADGE_URL}" style="zoom: 1.3" alt="Open In Colab"/></a>'

st.sidebar.title('')  # empty title, rendered before the link section
st.sidebar.markdown('Reference notebook:')
st.sidebar.markdown(link, unsafe_allow_html=True)
117
+
118
# Load Sample Text Files
folder_path = f"inputs/{selected_model}"


def _read_example(path):
    """Return the stripped second line of the file at *path*.

    Returns None when the file has fewer than two lines. The file is opened
    in a ``with`` block so the handle is closed as soon as it has been read.
    """
    with open(path, 'r', encoding='utf-8') as handle:
        lines = handle.readlines()
    return lines[1].strip() if len(lines) >= 2 else None


examples = []
# os.listdir returns entries in arbitrary order; sort so the samples always
# appear in the same order in the dropdown.
for filename in sorted(os.listdir(folder_path)):
    if not filename.endswith('.txt'):
        continue
    sample = _read_example(os.path.join(folder_path, filename))
    if sample is not None:
        examples.append(sample)
127
+
128
# Offer the bundled samples and a free-text field; both widgets are always
# rendered, sample picker first.
sample_choice = st.selectbox("Select a Sample Text", examples)
custom_input = st.text_input("Try it for yourself!")

# Non-empty custom text takes precedence over the chosen sample.
selected_text = custom_input if custom_input else sample_choice

# Display the Selected or Entered Text
st.subheader('Selected Text')
st.write(selected_text)
137
+
138
# Perform Translation and Display the Result
import html  # stdlib; needed only for escaping the rendered translation

st.subheader("Translation Result")

spark = init_spark()
pipeline = create_pipeline(selected_model)
output = fit_data(pipeline, selected_text)

# output[0][0] is the list of translated sentences for the single input row.
# Join with a space so consecutive sentences are not glued together.
res = " ".join(output[0][0])
HTML_WRAPPER = """<div class="scroll entities" style="overflow-x: auto; border: 1px solid #e6e9ef; border-radius: 0.25rem; padding: 1rem; margin-bottom: 2.5rem; white-space:pre-wrap">{}</div>"""
# The translation is derived from user-supplied text and is rendered with
# unsafe_allow_html=True, so escape it before placing it inside the markup.
st.markdown(HTML_WRAPPER.format(html.escape(res)), unsafe_allow_html=True)
148
+
149
+
Dockerfile ADDED
@@ -0,0 +1,72 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
# Base image: Ubuntu 18.04
FROM ubuntu:18.04

# Set environment variables.
# Uses the key=value form; the space-separated `ENV key value` form is legacy.
# HOME is set in a second instruction because it expands NB_USER, and a
# variable cannot be referenced in the same ENV instruction that defines it.
ENV NB_USER=jovyan \
    NB_UID=1000
ENV HOME=/home/${NB_USER} \
    JAVA_HOME=/usr/lib/jvm/java-8-openjdk-amd64/

# Install required packages.
# The apt package lists are removed in the same layer so they do not end up
# in the image; the next RUN refreshes them with its own `apt-get update`.
RUN apt-get update && apt-get install -y \
    tar \
    wget \
    bash \
    rsync \
    gcc \
    libfreetype6-dev \
    libhdf5-serial-dev \
    libpng-dev \
    libzmq3-dev \
    python3 \
    python3-dev \
    python3-pip \
    unzip \
    pkg-config \
    software-properties-common \
    graphviz \
    openjdk-8-jdk \
    ant \
    ca-certificates-java \
    && apt-get clean \
    && rm -rf /var/lib/apt/lists/* \
    && update-ca-certificates -f

# Install Python 3.8 and pip (-y: never wait for confirmation during a build)
RUN add-apt-repository -y ppa:deadsnakes/ppa \
    && apt-get update \
    && apt-get install -y python3.8 python3-pip \
    && apt-get clean \
    && rm -rf /var/lib/apt/lists/*

# Set up JAVA_HOME for login shells
RUN echo "export JAVA_HOME=/usr/lib/jvm/java-8-openjdk-amd64/" >> /etc/profile \
    && echo "export PATH=\$JAVA_HOME/bin:\$PATH" >> /etc/profile

# Create a new user named "jovyan" with user ID 1000
RUN useradd -m -u ${NB_UID} ${NB_USER}

# Switch to the "jovyan" user
USER ${NB_USER}

# Set home and path variables for the user; ~/.local/bin is where the
# user-level pip installs below place the `streamlit` executable.
ENV HOME=/home/${NB_USER} \
    PATH=/home/${NB_USER}/.local/bin:$PATH

# Set up PySpark to use Python 3.8 for both driver and workers
ENV PYSPARK_PYTHON=/usr/bin/python3.8
ENV PYSPARK_DRIVER_PYTHON=/usr/bin/python3.8

# Set the working directory to the user's home directory
WORKDIR ${HOME}

# Upgrade pip and install Python dependencies.
# requirements.txt is copied on its own first so this layer stays cached
# when only application code changes.
RUN python3.8 -m pip install --upgrade pip
COPY requirements.txt /tmp/requirements.txt
RUN python3.8 -m pip install -r /tmp/requirements.txt

# Copy the application code into the container at /home/jovyan
COPY --chown=${NB_USER}:${NB_USER} . ${HOME}

# Expose port for Streamlit
EXPOSE 7860

# Define the entry point for the container
ENTRYPOINT ["streamlit", "run", "Demo.py", "--server.port=7860", "--server.address=0.0.0.0"]
inputs/opus_mt_cpp_en/Example1.txt ADDED
@@ -0,0 +1,2 @@
 
 
 
1
+ Example1.txt
2
+ Além de ser o rei do norte, John Snow é um médico inglês e líder no desenvolvimento de anestesia e higiene médica. Ele é considerado o primeiro a usar dados para curar surto de cólera em 1854.
inputs/opus_mt_cpp_en/Example2.txt ADDED
@@ -0,0 +1,2 @@
 
 
 
1
+ Example2.txt
2
+ Titanic é um romance épico americano de 1997, um filme de desastre dirigido, escrito, co-produzido e co-editado por James Cameron. Incorporando aspectos históricos e ficcionalizados, é baseado em relatos do naufrágio do RMS Titanic. É estrelado por Leonardo DiCaprio e Kate Winslet como membros de diferentes classes sociais que se apaixonam a bordo do navio durante sua viagem inaugural malfadada.
inputs/opus_mt_cpp_en/Example3.txt ADDED
@@ -0,0 +1,2 @@
 
 
 
1
+ Example3.txt
2
+ William Henry Gates III (nascido em 28 de outubro de 1955) é um magnata dos negócios, desenvolvedor de software, investidor e filantropo americano. Ele é mais conhecido como o co-fundador da Microsoft Corporation. Durante sua carreira na Microsoft, Gates ocupou os cargos de presidente do conselho, diretor executivo (CEO), presidente e arquiteto-chefe de software. Ele também foi o maior acionista individual até maio de 2014. É um dos mais conhecidos empreendedores e pioneiros da revolução do microcomputador das décadas de 1970 e 1980.
inputs/opus_mt_cpp_en/Example4.txt ADDED
@@ -0,0 +1,2 @@
 
 
 
1
+ Example4.txt
2
+ A Mona Lisa é uma pintura a óleo do século 16 criada por Leonardo. É realizado no Louvre, em Paris.
inputs/opus_mt_cpp_en/Example5.txt ADDED
@@ -0,0 +1,2 @@
 
 
 
1
+ Example5.txt
2
+ O Facebook é um serviço de rede social lançado como TheFacebook em 4 de fevereiro de 2004. Foi fundado por Mark Zuckerberg com seus colegas de faculdade e colegas da Universidade de Harvard Eduardo Saverin, Andrew McCollum, Dustin Moskovitz e Chris Hughes. A associação do site foi inicialmente limitada pelos fundadores aos alunos de Harvard, mas foi expandida para outras faculdades na área de Boston, a Ivy League e, gradualmente, a maioria das universidades nos Estados Unidos e Canadá.
inputs/opus_mt_cpp_en/Example6.txt ADDED
@@ -0,0 +1,2 @@
 
 
 
1
+ Example6.txt
2
+ Geoffrey Everest Hinton é um psicólogo cognitivo e cientista da computação canadense inglês, mais conhecido por seu trabalho em redes neurais artificiais. Desde 2013, ele divide seu tempo trabalhando para o Google e a Universidade de Toronto. Em 2017, ele foi cofundador e se tornou o assessor científico-chefe do Vector Institute em Toronto.
inputs/opus_mt_cpp_en/Example7.txt ADDED
@@ -0,0 +1,2 @@
 
 
 
1
+ Example7.txt
2
+ Quando eu disse a John que queria me mudar para o Alasca, ele me avisou que teria problemas para encontrar um Starbucks lá.
inputs/opus_mt_de_en/Example1.txt ADDED
@@ -0,0 +1,2 @@
 
 
 
1
+ Example1.txt
2
+ John Snow ist ein englischer Arzt und ein Führer in der Entwicklung der Anästhesie des Nordens.. Er ist der erste, der Daten verwendet, um Choleraausbruch 1854 zu heilen.
inputs/opus_mt_de_en/Example2.txt ADDED
@@ -0,0 +1,2 @@
 
 
 
1
+ Example2.txt
2
+ Titanic ist ein US-amerikanischer Film von James Cameron.. Sie umfasst sowohl historische als auch fiktionalisierte Aspekte, basiert auf Konten der Versenken der RMS Titanic.. Es spielt Leonardo DiCaprio und Kate Winslet als Mitglieder der verschiedenen sozialen Klassen. Sie verliebt sich in das Schiff während seiner unglückselige Mädchen.
inputs/opus_mt_de_en/Example3.txt ADDED
@@ -0,0 +1,2 @@
 
 
 
1
+ Example3.txt
2
+ Oktober 1955 in New York City) ist ein US-amerikanischer Software-Entwickler, Investor und Philanthrop.. Während seiner Karriere bei Microsoft, Gates war die Positionen von Vorsitzender, Chief Executive Officer (CEO), Präsident und Chef Software Architekt.. Bis Mai 2014 war er der größte Einzelaktionär.. Er ist einer der bekanntesten Unternehmer und Pioniere der Mikrocomputerrevolution der 1970er und 1980er Jahre.
inputs/opus_mt_de_en/Example4.txt ADDED
@@ -0,0 +1,2 @@
 
 
 
1
+ Example4.txt
2
+ Die Mona Lisa ist ein Ölgemälde aus dem 16.. Es wird im Louvre in Paris gehalten.
inputs/opus_mt_de_en/Example5.txt ADDED
@@ -0,0 +1,2 @@
 
 
 
1
+ Example5.txt
2
+ Facebook ist ein Social Network Service am 4. Februar 2004.. Es wurde von Mark Zuckerberg mit seinen College-Mitbewohnern und anderen Harvard-Universitätsstudenten Eduardo Saverin, Andrew McCollum, Dustin Moskovitz gegründet.. Die Mitgliedschaft der Website wurde zunächst von Harvard Studenten, aber auch auf andere Hochschulen in der Boston, die Ivy League und allmählich die meisten Universitäten in den Vereinigten Staaten
inputs/opus_mt_de_en/Example6.txt ADDED
@@ -0,0 +1,2 @@
 
 
 
1
+ Example6.txt
2
+ Geoffrey Everest Hinton ist ein kanadischer Psychologe und Computer.. Seit 2013 arbeitet er für Google und die University of Toronto.. 2017 wurde er wissenschaftlicher Berater des Vector Institute in Toronto.
inputs/opus_mt_de_en/Example7.txt ADDED
@@ -0,0 +1,2 @@
 
 
 
1
+ Example7.txt
2
+ Als ich John sagte, dass ich nach Alaska ziehen wollte, dass ich Probleme hatte, dass ich ein Starbucks dort haben würde, er mich, dass ich hatte, dass ich hatte, dass ich
inputs/opus_mt_en_cpp/Example1.txt ADDED
@@ -0,0 +1,2 @@
 
 
 
1
+ Example1.txt
2
+ Other than being the king of the north, John Snow is an English physician and a leader in the development of anaesthesia and medical hygiene. He is considered for being the first one using data to cure cholera outbreak in 1854.
inputs/opus_mt_en_cpp/Example2.txt ADDED
@@ -0,0 +1,2 @@
 
 
 
1
+ Example2.txt
2
+ Titanic is a 1997 American epic romance and disaster film directed, written, co-produced, and co-edited by James Cameron. Incorporating both historical and fictionalized aspects, it is based on accounts of the sinking of the RMS Titanic. It stars Leonardo DiCaprio and Kate Winslet as members of different social classes who fall in love aboard the ship during its ill-fated maiden voyage.
inputs/opus_mt_en_cpp/Example3.txt ADDED
@@ -0,0 +1,2 @@
 
 
 
1
+ Example3.txt
2
+ William Henry Gates III (born October 28, 1955) is an American business magnate, software developer, investor, and philanthropist. He is best known as the co-founder of Microsoft Corporation. During his career at Microsoft, Gates held the positions of chairman, chief executive officer (CEO), president and chief software architect. He was also being the largest individual shareholder until May 2014. He is one of the best-known entrepreneurs and pioneers of the microcomputer revolution of the 1970s and 1980s.
inputs/opus_mt_en_cpp/Example4.txt ADDED
@@ -0,0 +1,2 @@
 
 
 
1
+ Example4.txt
2
+ The Mona Lisa is a 16th century oil painting created by Leonardo. It's held at the Louvre in Paris.
inputs/opus_mt_en_cpp/Example5.txt ADDED
@@ -0,0 +1,2 @@
 
 
 
1
+ Example5.txt
2
+ Facebook is a social networking service launched as TheFacebook on February 4, 2004. It was founded by Mark Zuckerberg with his college roommates and fellow Harvard University students Eduardo Saverin, Andrew McCollum, Dustin Moskovitz and Chris Hughes. The website's membership was initially limited by the founders to Harvard students, but was expanded to other colleges in the Boston area, the Ivy League, and gradually most universities in the United States and Canada.
inputs/opus_mt_en_cpp/Example6.txt ADDED
@@ -0,0 +1,2 @@
 
 
 
1
+ Example6.txt
2
+ Geoffrey Everest Hinton is an English Canadian cognitive psychologist and computer scientist, most noted for his work on artificial neural networks. Since 2013 he divides his time working for Google and the University of Toronto. In 2017, he cofounded and became the Chief Scientific Advisor of the Vector Institute in Toronto.
inputs/opus_mt_en_cpp/Example7.txt ADDED
@@ -0,0 +1,2 @@
 
 
 
1
+ Example7.txt
2
+ When I told John that I wanted to move to Alaska, he warned me that I'd have trouble finding a Starbucks there.
inputs/opus_mt_en_de/Example1.txt ADDED
@@ -0,0 +1,2 @@
 
 
 
1
+ Example1.txt
2
+ Other than being the king of the north, John Snow is an English physician and a leader in the development of anaesthesia and medical hygiene. He is considered for being the first one using data to cure cholera outbreak in 1854.
inputs/opus_mt_en_de/Example2.txt ADDED
@@ -0,0 +1,2 @@
 
 
 
1
+ Example2.txt
2
+ Titanic is a 1997 American epic romance and disaster film directed, written, co-produced, and co-edited by James Cameron. Incorporating both historical and fictionalized aspects, it is based on accounts of the sinking of the RMS Titanic. It stars Leonardo DiCaprio and Kate Winslet as members of different social classes who fall in love aboard the ship during its ill-fated maiden voyage.
inputs/opus_mt_en_de/Example3.txt ADDED
@@ -0,0 +1,2 @@
 
 
 
1
+ Example3.txt
2
+ William Henry Gates III (born October 28, 1955) is an American business magnate, software developer, investor, and philanthropist. He is best known as the co-founder of Microsoft Corporation. During his career at Microsoft, Gates held the positions of chairman, chief executive officer (CEO), president and chief software architect. He was also being the largest individual shareholder until May 2014. He is one of the best-known entrepreneurs and pioneers of the microcomputer revolution of the 1970s and 1980s.
inputs/opus_mt_en_de/Example4.txt ADDED
@@ -0,0 +1,2 @@
 
 
 
1
+ Example4.txt
2
+ The Mona Lisa is a 16th century oil painting created by Leonardo. It's held at the Louvre in Paris.
inputs/opus_mt_en_de/Example5.txt ADDED
@@ -0,0 +1,2 @@
 
 
 
1
+ Example5.txt
2
+ Facebook is a social networking service launched as TheFacebook on February 4, 2004. It was founded by Mark Zuckerberg with his college roommates and fellow Harvard University students Eduardo Saverin, Andrew McCollum, Dustin Moskovitz and Chris Hughes. The website's membership was initially limited by the founders to Harvard students, but was expanded to other colleges in the Boston area, the Ivy League, and gradually most universities in the United States and Canada.
inputs/opus_mt_en_de/Example6.txt ADDED
@@ -0,0 +1,2 @@
 
 
 
1
+ Example6.txt
2
+ Geoffrey Everest Hinton is an English Canadian cognitive psychologist and computer scientist, most noted for his work on artificial neural networks. Since 2013 he divides his time working for Google and the University of Toronto. In 2017, he cofounded and became the Chief Scientific Advisor of the Vector Institute in Toronto.
inputs/opus_mt_en_de/Example7.txt ADDED
@@ -0,0 +1,2 @@
 
 
 
1
+ Example7.txt
2
+ When I told John that I wanted to move to Alaska, he warned me that I'd have trouble finding a Starbucks there.
inputs/opus_mt_en_es/Example1.txt ADDED
@@ -0,0 +1,2 @@
 
 
 
1
+ Example1.txt
2
+ Other than being the king of the north, John Snow is an English physician and a leader in the development of anaesthesia and medical hygiene. He is considered for being the first one using data to cure cholera outbreak in 1854.
inputs/opus_mt_en_es/Example2.txt ADDED
@@ -0,0 +1,2 @@
 
 
 
1
+ Example2.txt
2
+ Titanic is a 1997 American epic romance and disaster film directed, written, co-produced, and co-edited by James Cameron. Incorporating both historical and fictionalized aspects, it is based on accounts of the sinking of the RMS Titanic. It stars Leonardo DiCaprio and Kate Winslet as members of different social classes who fall in love aboard the ship during its ill-fated maiden voyage.
inputs/opus_mt_en_es/Example3.txt ADDED
@@ -0,0 +1,2 @@
 
 
 
1
+ Example3.txt
2
+ William Henry Gates III (born October 28, 1955) is an American business magnate, software developer, investor, and philanthropist. He is best known as the co-founder of Microsoft Corporation. During his career at Microsoft, Gates held the positions of chairman, chief executive officer (CEO), president and chief software architect. He was also being the largest individual shareholder until May 2014. He is one of the best-known entrepreneurs and pioneers of the microcomputer revolution of the 1970s and 1980s.
inputs/opus_mt_en_es/Example4.txt ADDED
@@ -0,0 +1,2 @@
 
 
 
1
+ Example4.txt
2
+ The Mona Lisa is a 16th century oil painting created by Leonardo. It's held at the Louvre in Paris.
inputs/opus_mt_en_es/Example5.txt ADDED
@@ -0,0 +1,2 @@
 
 
 
1
+ Example5.txt
2
+ Facebook is a social networking service launched as TheFacebook on February 4, 2004. It was founded by Mark Zuckerberg with his college roommates and fellow Harvard University students Eduardo Saverin, Andrew McCollum, Dustin Moskovitz and Chris Hughes. The website's membership was initially limited by the founders to Harvard students, but was expanded to other colleges in the Boston area, the Ivy League, and gradually most universities in the United States and Canada.
inputs/opus_mt_en_es/Example6.txt ADDED
@@ -0,0 +1,2 @@
 
 
 
1
+ Example6.txt
2
+ Geoffrey Everest Hinton is an English Canadian cognitive psychologist and computer scientist, most noted for his work on artificial neural networks. Since 2013 he divides his time working for Google and the University of Toronto. In 2017, he cofounded and became the Chief Scientific Advisor of the Vector Institute in Toronto.
inputs/opus_mt_en_es/Example7.txt ADDED
@@ -0,0 +1,2 @@
 
 
 
1
+ Example7.txt
2
+ When I told John that I wanted to move to Alaska, he warned me that I'd have trouble finding a Starbucks there.
inputs/opus_mt_en_fr/Example1.txt ADDED
@@ -0,0 +1,2 @@
 
 
 
1
+ Example1.txt
2
+ Other than being the king of the north, John Snow is an English physician and a leader in the development of anaesthesia and medical hygiene. He is considered for being the first one using data to cure cholera outbreak in 1854.
inputs/opus_mt_en_fr/Example2.txt ADDED
@@ -0,0 +1,2 @@
 
 
 
1
+ Example2.txt
2
+ Titanic is a 1997 American epic romance and disaster film directed, written, co-produced, and co-edited by James Cameron. Incorporating both historical and fictionalized aspects, it is based on accounts of the sinking of the RMS Titanic. It stars Leonardo DiCaprio and Kate Winslet as members of different social classes who fall in love aboard the ship during its ill-fated maiden voyage.
inputs/opus_mt_en_fr/Example3.txt ADDED
@@ -0,0 +1,2 @@
 
 
 
1
+ Example3.txt
2
+ William Henry Gates III (born October 28, 1955) is an American business magnate, software developer, investor, and philanthropist. He is best known as the co-founder of Microsoft Corporation. During his career at Microsoft, Gates held the positions of chairman, chief executive officer (CEO), president and chief software architect. He was also being the largest individual shareholder until May 2014. He is one of the best-known entrepreneurs and pioneers of the microcomputer revolution of the 1970s and 1980s.
inputs/opus_mt_en_fr/Example4.txt ADDED
@@ -0,0 +1,2 @@
 
 
 
1
+ Example4.txt
2
+ The Mona Lisa is a 16th century oil painting created by Leonardo. It's held at the Louvre in Paris.
inputs/opus_mt_en_fr/Example5.txt ADDED
@@ -0,0 +1,2 @@
 
 
 
1
+ Example5.txt
2
+ Facebook is a social networking service launched as TheFacebook on February 4, 2004. It was founded by Mark Zuckerberg with his college roommates and fellow Harvard University students Eduardo Saverin, Andrew McCollum, Dustin Moskovitz and Chris Hughes. The website's membership was initially limited by the founders to Harvard students, but was expanded to other colleges in the Boston area, the Ivy League, and gradually most universities in the United States and Canada.
inputs/opus_mt_en_fr/Example6.txt ADDED
@@ -0,0 +1,2 @@
 
 
 
1
+ Example6.txt
2
+ Geoffrey Everest Hinton is an English Canadian cognitive psychologist and computer scientist, most noted for his work on artificial neural networks. Since 2013 he divides his time working for Google and the University of Toronto. In 2017, he cofounded and became the Chief Scientific Advisor of the Vector Institute in Toronto.
inputs/opus_mt_en_fr/Example7.txt ADDED
@@ -0,0 +1,2 @@
 
 
 
1
+ Example7.txt
2
+ When I told John that I wanted to move to Alaska, he warned me that I'd have trouble finding a Starbucks there.
inputs/opus_mt_en_it/Example1.txt ADDED
@@ -0,0 +1,2 @@
 
 
 
1
+ Example1.txt
2
+ Other than being the king of the north, John Snow is an English physician and a leader in the development of anaesthesia and medical hygiene. He is considered for being the first one using data to cure cholera outbreak in 1854.
inputs/opus_mt_en_it/Example2.txt ADDED
@@ -0,0 +1,2 @@
 
 
 
1
+ Example2.txt
2
+ Titanic is a 1997 American epic romance and disaster film directed, written, co-produced, and co-edited by James Cameron. Incorporating both historical and fictionalized aspects, it is based on accounts of the sinking of the RMS Titanic. It stars Leonardo DiCaprio and Kate Winslet as members of different social classes who fall in love aboard the ship during its ill-fated maiden voyage.
inputs/opus_mt_en_it/Example3.txt ADDED
@@ -0,0 +1,2 @@
 
 
 
1
+ Example3.txt
2
+ William Henry Gates III (born October 28, 1955) is an American business magnate, software developer, investor, and philanthropist. He is best known as the co-founder of Microsoft Corporation. During his career at Microsoft, Gates held the positions of chairman, chief executive officer (CEO), president and chief software architect. He was also being the largest individual shareholder until May 2014. He is one of the best-known entrepreneurs and pioneers of the microcomputer revolution of the 1970s and 1980s.
inputs/opus_mt_en_it/Example4.txt ADDED
@@ -0,0 +1,2 @@
 
 
 
1
+ Example4.txt
2
+ The Mona Lisa is a 16th century oil painting created by Leonardo. It's held at the Louvre in Paris.
inputs/opus_mt_en_it/Example5.txt ADDED
@@ -0,0 +1,2 @@
 
 
 
1
+ Example5.txt
2
+ Facebook is a social networking service launched as TheFacebook on February 4, 2004. It was founded by Mark Zuckerberg with his college roommates and fellow Harvard University students Eduardo Saverin, Andrew McCollum, Dustin Moskovitz and Chris Hughes. The website's membership was initially limited by the founders to Harvard students, but was expanded to other colleges in the Boston area, the Ivy League, and gradually most universities in the United States and Canada.