We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
1 parent ab9ff16 commit df9a5ef (Copy full SHA for df9a5ef)
poc/seq2seq1.py
@@ -221,8 +221,8 @@ def collate_fn(batch):
221
222
def train_model():
223
# Load and preprocess data
224
- english_data = open("../synthetic_data/news-commentary-v12.zh-en.en").readlines()
225
- chinese_data = open("../synthetic_data/news-commentary-v12.zh-en.zh").readlines()
+ english_data = open("../synthetic_data/news-commentary-v12.zh-en.en").readlines()[1:3000]
+ chinese_data = open("../synthetic_data/news-commentary-v12.zh-en.zh").readlines()[1:3000]
226
227
# Tokenize data
228
english_tokenized = [sentence.strip().split() for sentence in english_data]
0 commit comments