Skip to content

Commit 836f822

Browse files
committed
Bump version to 1.0.4
1 parent a17ec1e commit 836f822

File tree

3 files changed

+10
-5
lines changed

3 files changed

+10
-5
lines changed

examples/training/ms_marco/multilingual/translate_queries.py

Lines changed: 8 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -3,12 +3,16 @@
33
44
For machine translation, we use EasyNMT: https://github.com/UKPLab/EasyNMT
55
You can install it via: pip install easynmt
6+
7+
Usage:
8+
python translate_queries.py [target_language]
69
"""
710
import os
811
from sentence_transformers import LoggingHandler, util
912
import logging
1013
import tarfile
1114
from easynmt import EasyNMT
15+
import sys
1216

1317
#### Just some code to print debug information to stdout
1418
logging.basicConfig(format='%(asctime)s - %(message)s',
@@ -17,8 +21,10 @@
1721
handlers=[LoggingHandler()])
1822
#### /print debug information to stdout
1923

20-
target_lang = 'de'
24+
target_lang = sys.argv[1]
2125
output_folder = 'multilingual-data'
26+
data_folder = '../msmarco-data'
27+
2228
output_filename = os.path.join(output_folder, 'train_queries.en-{}.tsv'.format(target_lang))
2329
os.makedirs(output_folder, exist_ok=True)
2430

@@ -32,7 +38,6 @@
3238
translated_qids.add(splits[0])
3339

3440
### Now we read the MS Marco dataset
35-
data_folder = '../msmarco-data'
3641
os.makedirs(data_folder, exist_ok=True)
3742

3843
# Read qrels file for relevant positives per query
@@ -78,5 +83,5 @@
7883

7984
with open(output_filename, 'a' if os.path.exists(output_filename) else 'w', encoding='utf8') as fOut:
8085
for qid, query, translated_query in zip(qids, queries, translation_model.translate_stream(queries, source_lang='en', target_lang=target_lang, beam_size=2, perform_sentence_splitting=False, chunk_size=256, batch_size=64)):
81-
fOut.write("{}\t{}\t{}\n".format(qid, query.replace("\t", " "), translated_query.replace("\t", " ")))
86+
fOut.write("{}\t{}\t{}\n".format(qid, translated_query.replace("\t", " ")))
8287
fOut.flush()

sentence_transformers/__init__.py

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1,4 +1,4 @@
1-
__version__ = "1.0.3"
1+
__version__ = "1.0.4"
22
__DOWNLOAD_SERVER__ = 'http://sbert.net/models/'
33
from .datasets import SentencesDataset, ParallelSentencesDataset
44
from .LoggingHandler import LoggingHandler

setup.py

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -7,7 +7,7 @@
77

88
setup(
99
name="sentence-transformers",
10-
version="1.0.3",
10+
version="1.0.4",
1111
author="Nils Reimers",
1212
author_email="[email protected]",
1313
description="Sentence Embeddings using BERT / RoBERTa / XLM-R",

0 commit comments

Comments
 (0)