-
Notifications
You must be signed in to change notification settings - Fork 79
Expand file tree
/
Copy pathsimulstreaming_translate.py
More file actions
612 lines (501 loc) · 23 KB
/
simulstreaming_translate.py
File metadata and controls
612 lines (501 loc) · 23 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
464
465
466
467
468
469
470
471
472
473
474
475
476
477
478
479
480
481
482
483
484
485
486
487
488
489
490
491
492
493
494
495
496
497
498
499
500
501
502
503
504
505
506
507
508
509
510
511
512
513
514
515
516
517
518
519
520
521
522
523
524
525
526
527
528
529
530
531
532
533
534
535
536
537
538
539
540
541
542
543
544
545
546
547
548
549
550
551
552
553
554
555
556
557
558
559
560
561
562
563
564
565
566
567
568
569
570
571
572
573
574
575
576
577
578
579
580
581
582
583
584
585
586
587
588
589
590
591
592
593
594
595
596
597
598
599
600
601
602
603
604
605
606
607
608
609
610
611
612
import sys
import os
import ctranslate2
import sentencepiece as spm
import transformers
import json
import time
#import select
def generate_words(sp, step_results):
    """Yield whole decoded words from a stream of generation step results.

    SentencePiece marks a word start with the "▁" prefix; a token carrying
    that prefix closes the word buffered so far. Any tokens remaining when
    the stream ends are flushed as a final word. Empty decodings are skipped.
    """
    pending = []
    for step in step_results:
        starts_word = step.token.startswith("▁")
        if starts_word and pending:
            decoded = sp.decode(pending)
            pending = []
            if decoded:
                yield decoded
        pending.append(step.token_id)
    if pending:
        decoded = sp.decode(pending)
        if decoded:
            yield decoded
from simulstreaming.translate.sentence_segmenter import SentenceSegmenter
class LLMTranslator:
    """Chat-style translator: CTranslate2 causal LM + SentencePiece tokenizer.

    The model is prompted with a system message and the source text; an
    optional forced target prefix is appended to the prompt so generation
    continues an existing partial translation.
    """
    def __init__(self, system_prompt='Please translate.', max_context_length=4096, len_ratio=None, model_dir="ct2_EuroLLM-9B-Instruct/", tokenizer_dir="EuroLLM-9B-Instruct/"):
        # system_prompt: instruction prepended to every dialog.
        # max_context_length: token budget used to derive the trimming limit.
        # len_ratio: if set, output length is capped at len(src tokens) * len_ratio + 10.
        self.system_prompt = system_prompt
        print("Loading the model...", file=sys.stderr)
        self.generator = ctranslate2.Generator(model_dir, device="cuda")
        self.sp = spm.SentencePieceProcessor(os.path.join(tokenizer_dir,"tokenizer.model"))
        self.tokenizer = transformers.AutoTokenizer.from_pretrained(tokenizer_dir)
        print("...done", file=sys.stderr)
        self.max_context_length = max_context_length
        # Keep a small margin below the context limit when buffers are trimmed.
        self.max_tokens_to_trim = self.max_context_length - 10
        self.len_ratio = len_ratio
        # my regex sentence segmenter
        self.segmenter = SentenceSegmenter()
    def start_dialog(self):
        """Return a fresh dialog containing only the system message."""
        return [{'role':'system', 'content': self.system_prompt }]
    def build_prompt(self, dialog):
        # Build prompt with system + user + generation prompt (assistant turn marker),
        # NOTE(review): apply_chat_template(tokenize=True) returns a plain id list
        # unless return_dict=True in recent transformers versions — confirm the
        # installed version supports the ["input_ids"] access used here.
        base_toks = self.tokenizer.apply_chat_template(dialog[:2], tokenize=True, add_generation_prompt=True)["input_ids"]
        if len(dialog) == 3: # if there is assistant message
            # then append the forced assistant content tokens.
            forced_toks = self.tokenizer.encode(dialog[2]['content'], add_special_tokens=False)
            toks = base_toks + forced_toks
        else:
            toks = base_toks
        print("len toks:", len(toks), file=sys.stderr)
        # CTranslate2's generate_tokens expects token strings, not ids.
        c = self.tokenizer.convert_ids_to_tokens(toks)
        return c
    def translate(self, src, tgt_forced=""):
        """Translate src; a non-empty tgt_forced becomes a forced target prefix.

        Returns the SentencePiece-decoded text of the generated continuation.
        """
        dialog = self.start_dialog()
        dialog += [{'role':'user','content': src}]
        if tgt_forced != "":
            dialog += [{'role':'assistant','content': tgt_forced}]
        prompt_tokens = self.build_prompt(dialog)
        if self.len_ratio is not None:
            # Cap output length relative to source length to limit hallucination.
            limit_len = int(len(self.tokenizer.encode(src)) * self.len_ratio) + 10
            limit_kw = {'max_length': limit_len}
        else:
            limit_kw = {}
        step_results = self.generator.generate_tokens(
            prompt_tokens,
            **limit_kw,
        )
        res = []
        for step_result in step_results:
            res.append(step_result)
        return self.sp.decode([r.token_id for r in res])
class ParallelTextBuffer:
    """Aligned source/target history, trimmed to a token budget.

    Source text is kept as a list of word lists (one per inserted segment),
    target text as a parallel list of strings. trim() shortens both sides
    from the oldest end until the tokenized lengths fit into max_tokens.
    """
    def __init__(self, tokenizer, max_tokens, trimming="segments", init_src="", init_tgt=""):
        # tokenizer: any object with .encode(str) -> sequence; only the length
        # of the result is used, to measure the buffer against max_tokens.
        # trimming: "segments" drops whole inserted segments; "sentences" drops
        # leading sentences found by the regex sentence segmenter.
        self.tokenizer = tokenizer
        self.max_tokens = max_tokens
        self.src_buffer = []  # list of lists of words
        if init_src:
            # Accept a pre-split word list or a plain string; normalize to a
            # word list so the list-of-lists invariant always holds. (A plain
            # string used to be stored as-is and was later joined char-by-char.)
            self.src_buffer.append(init_src if isinstance(init_src, list) else init_src.split())
        self.tgt_buffer = []  # list of strings
        if init_tgt:
            self.tgt_buffer.append(init_tgt)
        self.trimming = trimming
        if self.trimming == "sentences":
            self.segmenter = SentenceSegmenter()
    def len_src(self):
        """Source length in words, counting one separator per segment gap.

        Returns 0 for an empty buffer (the previous formula yielded -1).
        """
        if not self.src_buffer:
            return 0
        return sum(len(t) for t in self.src_buffer) + len(self.src_buffer) - 1
    def insert(self, src, tgt):
        """Append one aligned (word-list, string) segment pair."""
        self.src_buffer.append(src)
        self.tgt_buffer.append(tgt)
    def insert_src_suffix(self, s):
        """Glue s onto the last source word (a word split across input chunks)."""
        if self.src_buffer:
            self.src_buffer[-1][-1] += s
        else:
            self.src_buffer.append([s])
    def trim_sentences(self):
        """Drop leading sentences from both sides until the budget fits.

        Collapses the buffers into a single segment afterwards and returns
        the trimmed (src, tgt) strings.
        """
        src = " ".join(" ".join(b) for b in self.src_buffer)
        tgt = "".join(self.tgt_buffer)
        src_sp_toks = self.tokenizer.encode(src)
        tgt_sp_toks = self.tokenizer.encode(tgt)
        def trim_sentence(text):
            # Remove the first sentence of text; "" when nothing remains.
            sents = self.segmenter(text)
            print("SENTS:", len(sents), sents, file=sys.stderr)
            return "".join(sents[1:])
        while len(src_sp_toks) + len(tgt_sp_toks) > self.max_tokens:
            nsrc = trim_sentence(src)
            ntgt = trim_sentence(tgt)
            if not nsrc or not ntgt:
                # Cannot trim further without emptying one side; keep what we have.
                print("src or tgt is empty after trimming.", file=sys.stderr)
                print("src: ", src, file=sys.stderr)
                print("tgt: ", tgt, file=sys.stderr)
                break
            src = nsrc
            tgt = ntgt
            src_sp_toks = self.tokenizer.encode(src)
            tgt_sp_toks = self.tokenizer.encode(tgt)
        print("TRIMMED SRC:", (src,), file=sys.stderr)
        print("TRIMMED TGT:", (tgt,), file=sys.stderr)
        self.src_buffer = [src.split()]
        self.tgt_buffer = [tgt]
        return src, tgt
    def trim_segments(self):
        """Drop the oldest aligned segments until the budget fits.

        Always keeps at least one segment per side. Returns (src, tgt) strings.
        """
        print("BUFFER:", file=sys.stderr)
        for s, t in zip(self.src_buffer, self.tgt_buffer):
            print("\t", s, "...", t, file=sys.stderr)
        src = " ".join(" ".join(b) for b in self.src_buffer)
        tgt = "".join(self.tgt_buffer)
        src_sp_toks = self.tokenizer.encode(src)
        tgt_sp_toks = self.tokenizer.encode(tgt)
        while len(src_sp_toks) + len(tgt_sp_toks) > self.max_tokens:
            if len(self.src_buffer) > 1 and len(self.tgt_buffer) > 1:
                self.src_buffer.pop(0)
                self.tgt_buffer.pop(0)
            else:
                break
            src = " ".join(" ".join(b) for b in self.src_buffer)
            tgt = "".join(self.tgt_buffer)
            src_sp_toks = self.tokenizer.encode(src)
            tgt_sp_toks = self.tokenizer.encode(tgt)
        print("TRIMMED SEGMENTS SRC:", (src,), file=sys.stderr)
        print("TRIMMED SEGMENTS TGT:", (tgt,), file=sys.stderr)
        return src, tgt
    def trim(self):
        """Trim according to the configured strategy; returns (src, tgt)."""
        if self.trimming == "sentences":
            return self.trim_sentences()
        return self.trim_segments()
class SimulLLM:
    """LocalAgreement-style simultaneous translation driver around LLMTranslator.

    Words are inserted incrementally; each update re-translates the trimmed
    source buffer and confirms the longest common prefix between the previous
    unconfirmed output and the new output.
    """
    def __init__(self, llmtrans, min_len=0, chunk=1, trimming="sentences", language="ja", init_src="", init_tgt=""):
        # min_len: minimum number of buffered source words before translating.
        # chunk: number of words processed per LocalAgreement step.
        self.llmtranslator = llmtrans
        self.min_len = min_len
        self.step = chunk
        self.language = language
        # Japanese/Chinese output is written without spaces between words.
        if language in ["ja", "zh"]:
            self.specific_space = ""
        else:
            self.specific_space = " "
        self.trimming = trimming
        self.init_src = init_src
        self.init_tgt = init_tgt
        self.init()
    def init(self):
        """Reset rolling state; called at start and after each final segment."""
        self.buffer = ParallelTextBuffer(self.llmtranslator.tokenizer, self.llmtranslator.max_tokens_to_trim, trimming=self.trimming, init_src=self.init_src, init_tgt=self.init_tgt)
        self.last_inserted = []
        self.last_unconfirmed = ""
    def insert(self, src):
        """Append a word (str) or a list of words to the pending input."""
        if isinstance(src, str):
            self.last_inserted.append(src)
        else:
            self.last_inserted += src
    def insert_suffix(self, text):
        '''
        Insert suffix of a word to the last inserted word.
        It may be because the word was split to multiple parts in the input, each with different timestamps.
        '''
        if self.last_inserted:
            self.last_inserted[-1] += text
        elif self.buffer.src_buffer:
            self.buffer.insert_src_suffix(text)
        else:
            # this shouldn't happen
            self.last_inserted.append(text)
    def trim_longest_common_prefix(self, a, b):
        """Split off the longest common prefix of a and b.

        Returns (common_prefix_of_a, remainder_of_b). Comparison is per word
        for spaced languages and per character for ja/zh.
        """
        if self.language not in ["ja", "zh"]:
            a = a.split()
            b = b.split()
        # Count matching leading items. (The previous enumerate/break version
        # under-counted by one when one sequence was a prefix of the other,
        # so the last agreeing word was never confirmed.)
        i = 0
        for x, y in zip(a, b):
            if x != y:
                break
            i += 1
        if self.language in ["ja", "zh"]:
            return a[:i], b[i:]
        else:
            return " ".join(a[:i]), " ".join(b[i:])
    def process_iter(self, is_final=False):
        """Run one translation update.

        Yields ("INCOMPLETE", confirmed_so_far, unconfirmed) after each
        LocalAgreement step and a final ("COMPLETE", confirmed, unconfirmed).
        """
        print("IS FINAL:", is_final, file=sys.stderr)
        if not is_final and self.buffer.len_src() + len(self.last_inserted) < self.min_len:
            # NOTE(review): this is a generator function, so this returned tuple
            # is only visible via StopIteration.value; iterating callers simply
            # see no output for short input — confirm that is intended.
            return ("COMPLETE", "", "")
        src, forced_tgt = self.buffer.trim()
        confirmed_out = ""
        run = False
        for i in range(2):
            if i == 0:
                # first, catch up all but the last chunk.
                w = self.last_inserted[:-self.step]
                if not w:
                    continue
            else:
                w = self.last_inserted[-self.step:]
                if len(w) < self.step and not is_final:
                    # do not process the last incomplete chunk, wait for more input
                    # (unless it's final)
                    continue
            if w:
                src += " " + " ".join(w)
            run = True
            print("SRC",src,file=sys.stderr)
            print("FORCED TGT",forced_tgt,file=sys.stderr)
            out = self.llmtranslator.translate(src, forced_tgt)
            print("OUT",out,file=sys.stderr)
            # Confirm the part of the previous unconfirmed output that the new
            # output agrees with; keep the rest as the new unconfirmed tail.
            confirmed, unconfirmed = self.trim_longest_common_prefix(self.last_unconfirmed, out)
            self.last_unconfirmed = unconfirmed
            if confirmed:
                confirmed_out += self.specific_space + confirmed
            print("CONFIRMED NOW:",confirmed,file=sys.stderr)
            yield ("INCOMPLETE", confirmed_out, unconfirmed)
            print(file=sys.stderr)
            print(file=sys.stderr)
            print("#################",file=sys.stderr)
        if run:
            self.buffer.insert(self.last_inserted, confirmed_out)
            self.last_inserted = []
        ret = confirmed_out
        print("RET:",ret,file=sys.stderr)
        yield ("COMPLETE", ret, self.last_unconfirmed)
    def finish(self):
        # Flush the remaining unconfirmed text; assumes the caller re-inits
        # (via init()) before continuing after finish.
        yield ("COMPLETE", self.last_unconfirmed, "")
### default prompts
# Language code -> English language name; used to fill the system prompt template.
lan_to_name = {
    "de": "German",
    "ja": "Japanese",
    "zh-tr": "Chinese Traditional",
    "zh-sim": "Chinese Simplified",
    "cs": "Czech",
    "hu": "Hungarian",
    "en": "English",
    # EuroLLM languages
    # TODO: check, it's by ChatGPT.
    "bg": "Bulgarian",
    "hr": "Croatian",
    # "cs": "Czech",
    "da": "Danish",
    "nl": "Dutch",
    # "en": "English",
    "et": "Estonian",
    "fi": "Finnish",
    "fr": "French",
    # "de": "German",
    "el": "Greek",
    # "hu": "Hungarian",
    "ga": "Irish",
    "it": "Italian",
    "lv": "Latvian",
    "lt": "Lithuanian",
    "mt": "Maltese",
    "pl": "Polish",
    "pt": "Portuguese",
    "ro": "Romanian",
    "sk": "Slovak",
    "sl": "Slovenian",
    "es": "Spanish",
    "sv": "Swedish",
    "ar": "Arabic",
    "ca": "Catalan",
    # "zh": "Chinese",
    "gl": "Galician",
    "hi": "Hindi",
    # "ja": "Japanese",
    "ko": "Korean",
    "no": "Norwegian",
    "ru": "Russian",
    "tr": "Turkish",
    "uk": "Ukrainian"
}
SrcLang = "English" # TODO: default parameters.
TgtLang = "German"
# .format() template (not an f-string); placeholders are filled at factory time.
default_prompt="You are simultaneous interpreter from {SrcLang} to {TgtLang}. We are at a conference. It is important that you translate " + \
"only what you hear, nothing else!"
# Default warm-up sentence used to prime the translation (English).
default_init = "Please, go ahead, you can start with your presentation, we are ready."
# Language code -> default warm-up sentence in that language.
default_inits_tgt = {
    "en": default_init,
    'de': "Bitte schön, Sie können mit Ihrer Präsentation beginnen, wir sind bereit.",
    'ja': "どうぞ、プレゼンテーションを始めてください。", # "Please go ahead and start your presentation." in English
    'zh-tr': "請繼續,您可以開始您的簡報,我們已經準備好了。",
    'zh-sim': "请吧,你可以开始发言了,我们已经准备好了。",
    'cs': "Prosím, můžete začít s prezentací, jsme připraveni.",
    "hu": "Kérlek, kezdheted a prezentációdat, készen állunk."
}
# how many times is target text longer than English
# This was an attempt to stop generation if translation is longer than this ratio of the source, to prevent hallucinations.
# TODO: not tested rigorously.
lan_thresholds = {
    'de': 1.3, # 12751/9817 ... the proportion of subword tokens for ACL6060 dev de vs. en text, for EuroLLM-9B-Instruct tokenizer
    'ja': 1.34, # 13187/9817
    'zh': 1.23, # 12115/9817
    'zh-tr': 1.23, # 12115/9817
    'zh-sim': 1.23, # 12115/9817
    # TODO: guessed, not measured:
    'hu': 1.34,
    # 'cs': unknown, guessed
}
# Wildcard import provides hovercraft_translations (example sentences per language).
from simulstreaming.translate.hovercraft import *
# All language codes accepted by --src-lan / --tgt-lan.
lan_choices = sorted(set(list(lan_to_name.keys())+list(hovercraft_translations.keys())))
def translate_args(parser):
    """Register translation-related CLI options on parser."""
    parser.add_argument('--min-chunk-size', type=int, default=1,
                        help='Minimum number of space-delimited words to process in each LocalAgreement update. The more, the higher quality, but slower.')
    parser.add_argument('--min-len', type=int, default=1,
                        help='Minimum number of space-delimited words at the beginning.')
    parser.add_argument('--src-lan', '--src-language', type=str, default="en",
                        help="Source language code.",
                        choices=lan_choices)
    parser.add_argument('--tgt-lan', '--tgt-language', type=str, default="de",
                        help="Target language code.",
                        choices=lan_choices)
    parser.add_argument('--sys_prompt', type=str, default=None,
                        help='System prompt. If None, default one is used, depending on the language.')
    # Help text below completed: the original trailed off after "Default is ".
    parser.add_argument('--init_prompt_src', type=str, default=None,
                        help='Init translation with source text. It should be a complete sentence in the source language. '
                             'It can be context specific for the given input. A language-dependent default is used if not set.')
    parser.add_argument('--init_prompt_tgt', type=str, default=None,
                        help='Init translation with this target. It should be example translation of init_prompt_src. '
                             ' There is default init message, depending on the language.')
    # Help text below repaired: the original contained the broken sentence
    # "It should reflect the target language and.".
    parser.add_argument('--len-threshold', type=float, default=None,
                        help='Ratio of the length of the source and generated target, in number of sentencepiece tokens. '
                             'It should reflect the target language. If not set, no len-threshold is used.')
    parser.add_argument('--language-specific-len-threshold', default=False, action="store_true",
                        help='Use language-specific length threshold, e.g. 1.3 for German.')
    parser.add_argument("--max-context-length", type=int, default=4096, help="Maximum number of tokens in the model to use.")
    parser.add_argument("--buffer_trimming", type=str, default="sentences", choices=["segments","sentences"], help="Buffer trimming strategy.")
    parser.add_argument("--model-dir", type=str, default="ct2_EuroLLM-9B-Instruct/", help="ct2 model directory. If not set, the default ct2_EuroLLM-9B-Instruct/ is used.")
    parser.add_argument("--tokenizer-dir", type=str, default="EuroLLM-9B-Instruct/", help="tokenizer directory. If not set, the default EuroLLM-9B-Instruct/ is used.")
    parser.add_argument("-l", "--log-level", dest="log_level",
                        choices=['DEBUG', 'INFO', 'WARNING', 'ERROR', 'CRITICAL'],
                        help="Set the log level", default='DEBUG')
def simulation_args(parser):
    """Register input-simulation CLI options on parser.

    (Sketches for --input-instance / --output_instance / --offline options
    existed here as commented-out code; only jsonl input is supported now.)
    """
    parser.add_argument(
        '--input-jsonl',
        type=str,
        default=None,
        help="Filename of jsonl file to simulate input. If not set, it is read from stdin.",
    )
    parser.add_argument(
        '--comp_unaware',
        action="store_true",
        default=False,
        help='Computationally unaware simulation.',
    )
def simul_translator_factory(args):
    """Build a SimulLLM from parsed CLI args: prompts, length threshold, model."""
    # Resolve the system prompt: user override, or template filled with names.
    if args.sys_prompt is None:
        TgtLang = lan_to_name[args.tgt_lan]
        SrcLang = lan_to_name[args.src_lan]
        sys_prompt = default_prompt.format(SrcLang=SrcLang, TgtLang=TgtLang)
    else:
        sys_prompt = args.sys_prompt
    # Resolve the warm-up (init) source/target sentence pair.
    if args.init_prompt_src is None:
        if args.src_lan in default_inits_tgt and args.tgt_lan in default_inits_tgt:
            default_translations = default_inits_tgt
        else:
            # NOTE(review): falls back to hovercraft_translations; a language
            # missing from that table too would raise KeyError below — confirm
            # lan_choices guarantees coverage.
            default_translations = hovercraft_translations
        init_src = default_translations[args.src_lan].split()
        if args.init_prompt_tgt is None:
            init_tgt = default_translations[args.tgt_lan]
            if args.tgt_lan == "ja" and args.src_lan == "en":
                # Use an English source sentence matching the shorter Japanese default.
                init_src = 'Please go ahead and start your presentation.'.split()
                print("WARNING: Default init_prompt_src not set, src_lan is English and tgt_lan is Japanese. The init_src prompt changed to be more verbose.", file=sys.stderr)
        else:
            print("WARNING: init_prompt_tgt is used, init_prompt_src is None, the default one. It may be wrong!", file=sys.stderr)
            init_tgt = args.init_prompt_tgt
    else:
        init_src = args.init_prompt_src.split()
        if args.init_prompt_tgt is None:
            print("WARNING: init_prompt_src is used, init_prompt_tgt is None, so the default one is used. It may be wrong!", file=sys.stderr)
            init_tgt = default_inits_tgt[args.tgt_lan]
        else:
            init_tgt = args.init_prompt_tgt
    print("INFO: System prompt:", sys_prompt, file=sys.stderr)
    print("INFO: Init prompt src:", init_src, file=sys.stderr)
    print("INFO: Init prompt tgt:", init_tgt, file=sys.stderr)
    # Length threshold: per-language table or explicit value, mutually exclusive.
    if args.language_specific_len_threshold:
        if args.len_threshold is not None:
            print("ERROR: --len-threshold is set, but --language-specific-len-threshold is also set. Only one can be used.", file=sys.stderr)
            sys.exit(1)
        else:
            len_threshold = lan_thresholds[args.tgt_lan]
    else:
        len_threshold = args.len_threshold
    llmtrans = LLMTranslator(system_prompt=sys_prompt, max_context_length=args.max_context_length, len_ratio=len_threshold,
                             model_dir=args.model_dir, tokenizer_dir=args.tokenizer_dir)
    # zh-tr / zh-sim share the no-space output handling of "zh".
    lan = args.tgt_lan if not args.tgt_lan.startswith("zh") else "zh"
    simul = SimulLLM(llmtrans,language=lan, min_len=args.min_len, chunk=args.min_chunk_size,
                     init_src=init_src, init_tgt=init_tgt, trimming=args.buffer_trimming
                     )
    return simul
class SimulationTimer:
    """Clock for simulations.

    In computationally aware mode, now() returns real wall-clock time elapsed
    since construction; otherwise it simply echoes the provided emission_time.
    """
    def __init__(self, comp_aware=True):
        self.beg_time = time.time()
        self.comp_aware = comp_aware
    def now(self, emission_time=None):
        """Current simulation time in seconds."""
        if not self.comp_aware:
            return emission_time
        return time.time() - self.beg_time
def format_outputs(out_seq, in_row, timer, is_final=False):
    """Convert (status, confirmed, unconfirmed) tuples into output row dicts.

    The emission time comes from the timer (which may echo the input row's
    own emission_time in computationally unaware mode).
    """
    for status, confirmed_text, unconfirmed_text in out_seq:
        yield {
            "emission_time": timer.now(in_row["emission_time"]),
            "end": in_row.get("end", None),
            "status": status,
            "text": confirmed_text,
            "unconfirmed_text": unconfirmed_text,
            "is_final": is_final,
        }
def handle_outputs(out_seq, in_row, timer, is_final=False):
    """Print each formatted output row as one JSON line on stdout (flushed)."""
    for record in format_outputs(out_seq, in_row, timer, is_final=is_final):
        print(json.dumps(record), flush=True)
def simulation_update(simul, rows, timer, out_handler=handle_outputs):
    """Feed input rows into simul and emit translation updates via out_handler.

    All rows are inserted first and translated in one update, except final
    rows, which trigger an immediate update + finish + state reset.
    TODO: experiment whether batching is wise. It may accumulate delay in the worst case.
    """
    inserted = False
    for row in rows:
        if "text" in row and row["text"] != "":
            print("INPUT:", row["text"], file=sys.stderr)
            words = row["text"].split()
            # A chunk without a leading space continues the previous word —
            # presumably the upstream (Whisper-style) tokens keep leading
            # spaces; TODO confirm against the producer.
            # Guard on `words`: whitespace-only text (e.g. "\t") passes the
            # != "" check but splits to [], which used to crash on words[0].
            if words and not row["text"].startswith(" "):
                simul.insert_suffix(words[0])
                words = words[1:]
            simul.insert(words)
            inserted = True
        if row["is_final"]:
            if inserted:
                out = simul.process_iter(is_final=row["is_final"])
                out_handler(out, row, timer)
            out = simul.finish()
            out_handler(out, row, timer, is_final=True)
            simul.init()
            inserted = False
    if inserted:
        out = simul.process_iter(is_final=False) # if the last row is final, it was already processed.
        out_handler(out, row, timer)
def main_simulation_from_file():
    """CLI entry point: simulate streaming translation from a jsonl file or stdin.

    In computationally unaware mode every row is processed immediately; in
    aware mode rows are batched while "late" and the loop sleeps until each
    future row's emission_time before translating the batch.
    """
    import argparse
    parser = argparse.ArgumentParser()
    translate_args(parser)
    simulation_args(parser)
    args = parser.parse_args()
    if not args.comp_unaware and args.input_jsonl is None:
        # (was an f-string with no placeholders)
        print("ERROR: Reading stdin in computationally aware simulation does not work. Loading the model breaks timing. Use --input-jsonl instead.", file=sys.stderr)
        sys.exit(1)
    simul = simul_translator_factory(args)
    if args.input_jsonl is not None:
        ifile = open(args.input_jsonl, "r")
        inform_ifile = args.input_jsonl
    else:
        ifile = sys.stdin
        inform_ifile = "stdin"
    un = "un" if args.comp_unaware else ""
    print(f"INFO: Reading {inform_ifile} in jsonl format, computationally {un}aware simulation.", file=sys.stderr)
    timer = SimulationTimer(comp_aware=not args.comp_unaware)
    # try/finally so the input file is closed even if the simulation raises.
    try:
        if args.comp_unaware:
            # Ignore wall clock; process each row as soon as it is read.
            for line in ifile:
                row = json.loads(line)
                simulation_update(simul, [row], timer)
        else:
            # Computationally aware simulation from file.
            rows = []
            for line in ifile:
                row = json.loads(line)
                # to allow cascading, e.g. whisper->eurollm->eurollm:
                if "status" in row and row["status"] == "INCOMPLETE":
                    continue
                rows.append(row)
                if timer.now() > row["emission_time"]:
                    # Row is already late; batch it and keep reading.
                    continue
                # Wait until this row's emission time, then flush the batch.
                # (A redundant `elif timer.now() <= ...` re-check was removed:
                # time advancing between the two calls could silently defer
                # the batch.)
                while timer.now() < row["emission_time"]:
                    time.sleep(0.01)
                simulation_update(simul, rows, timer)
                rows = []
            if rows:
                simulation_update(simul, rows, timer)
    finally:
        if args.input_jsonl is not None:
            ifile.close()
# Script entry point: run the jsonl-driven simulation CLI.
if __name__ == "__main__":
    main_simulation_from_file()