Update main_process/salamandra_router.py
Browse files
main_process/salamandra_router.py
CHANGED
|
@@ -156,8 +156,6 @@ class Add_AD:
|
|
| 156 |
self.data = data
|
| 157 |
|
| 158 |
def __call__(self, state: NState, srt_original_silence, srt_original_silence_con_ad) -> NState:
|
| 159 |
-
print("Add_Ad.__call__ iniciado")
|
| 160 |
-
|
| 161 |
with open(srt_original_silence, "r", encoding="utf-8") as f:
|
| 162 |
srt_text = f.read()
|
| 163 |
|
|
@@ -302,8 +300,6 @@ class Add_AD:
|
|
| 302 |
|
| 303 |
class Add_Silence_AD:
|
| 304 |
def __call__(self, state: NState, srt_original_silence_con_ad, srt_original_silence_con_ad_silence) -> NState:
|
| 305 |
-
print("Add_Silence_AD.__call__ iniciado")
|
| 306 |
-
|
| 307 |
with open(srt_original_silence_con_ad, "r", encoding="utf-8") as f:
|
| 308 |
srt_text = f.read()
|
| 309 |
|
|
@@ -372,12 +368,12 @@ class Add_Silence_AD:
|
|
| 372 |
|
| 373 |
return state
|
| 374 |
|
| 375 |
-
def es_silencio(texto):
|
| 376 |
-
if "(AD):" in texto:
|
| 377 |
-
if "OCR:" in texto:
|
| 378 |
return False
|
| 379 |
|
| 380 |
-
elif "[" in texto:
|
| 381 |
return False
|
| 382 |
|
| 383 |
else:
|
|
@@ -388,8 +384,6 @@ def es_silencio(texto):
|
|
| 388 |
|
| 389 |
class Unir_AD_Silence:
|
| 390 |
def __call__(self, state: NState, srt_original_silence_con_ad_silence, srt_original_silence_con_ad_silence_unidos) -> NState:
|
| 391 |
-
print("Unir_AD_Silence.__call__ iniciado")
|
| 392 |
-
|
| 393 |
with open(srt_original_silence_con_ad_silence, "r", encoding="utf-8") as f:
|
| 394 |
srt_text = f.read()
|
| 395 |
|
|
@@ -422,7 +416,7 @@ class Unir_AD_Silence:
|
|
| 422 |
while i < len(srt_blocks):
|
| 423 |
actual = srt_blocks[i]
|
| 424 |
|
| 425 |
-
if es_silencio(actual["text"]) and "(AD):" in actual["text"]:
|
| 426 |
origenes = [i]
|
| 427 |
start_time = actual["start"]
|
| 428 |
end_time = actual["end"]
|
|
@@ -430,7 +424,7 @@ class Unir_AD_Silence:
|
|
| 430 |
texto_ocr = ocr_text[i]
|
| 431 |
texto_descripcion = descripcion[i]
|
| 432 |
|
| 433 |
-
while j < len(srt_blocks) and es_silencio(srt_blocks[j]["text"]) and "(AD):" in srt_blocks[j]["text"]:
|
| 434 |
end_time = srt_blocks[j]["end"]
|
| 435 |
origenes.append(j)
|
| 436 |
texto_ocr += "" + ocr_text[j]
|
|
@@ -479,8 +473,6 @@ class Unir_AD_Silence:
|
|
| 479 |
|
| 480 |
class Unir_AD_Silences_a_ADs:
|
| 481 |
def __call__(self, state: NState, srt_original_silence_con_ad_silence_unidos_silence, srt_original_silence_con_ad_silence_unidos_silence_general) -> NState:
|
| 482 |
-
print("Unir_AD_Silences_a_ADs.__call__ iniciado")
|
| 483 |
-
|
| 484 |
with open(srt_original_silence_con_ad_silence_unidos_silence, "r", encoding="utf-8") as f:
|
| 485 |
srt_text = f.read()
|
| 486 |
|
|
@@ -514,7 +506,7 @@ class Unir_AD_Silences_a_ADs:
|
|
| 514 |
|
| 515 |
if "(AD):" in block["text"]:
|
| 516 |
|
| 517 |
-
if es_silencio(block["text"]):
|
| 518 |
if i!=0 and ("(AD): OCR:" in srt_blocks[i-1]["text"]):
|
| 519 |
continue
|
| 520 |
|
|
@@ -533,11 +525,11 @@ class Unir_AD_Silences_a_ADs:
|
|
| 533 |
|
| 534 |
elif "(AD): OCR:" in block["text"]:
|
| 535 |
|
| 536 |
-
if i!=0 and es_silencio(srt_blocks[i-1]["text"]):
|
| 537 |
start_time = srt_blocks[i-1]["start"]
|
| 538 |
antes = True
|
| 539 |
|
| 540 |
-
if i!= len(srt_blocks)-1 and es_silencio(srt_blocks[i+1]["text"]):
|
| 541 |
end_time = srt_blocks[i+1]["end"]
|
| 542 |
despues = True
|
| 543 |
|
|
@@ -627,7 +619,6 @@ def words_silence_srt(srt_silence_path):
|
|
| 627 |
|
| 628 |
class Introduccion_OCR:
|
| 629 |
def __call__(self, state: NState, srt_original_silence_con_ad_silence_unidos_silence_general, srt_original_silence_con_ad_silence_unidos_silence_general_ocr):
|
| 630 |
-
print("Introduccion_OCR.__call__ iniciat")
|
| 631 |
|
| 632 |
words_silence = words_silence_srt(srt_original_silence_con_ad_silence_unidos_silence_general)
|
| 633 |
|
|
@@ -709,7 +700,6 @@ class Introduccion_OCR:
|
|
| 709 |
|
| 710 |
class Identity_Manager:
|
| 711 |
def __call__(self, state: NState, srt_original_silence_con_ad_ocr, srt_original_silence_con_ad_ocr_identity):
|
| 712 |
-
print("Identity_Manager.__call__ iniciat")
|
| 713 |
|
| 714 |
with open(srt_original_silence_con_ad_ocr, "r", encoding="utf-8-sig") as f:
|
| 715 |
srt_text = f.read()
|
|
@@ -792,7 +782,6 @@ class Identity_Manager:
|
|
| 792 |
|
| 793 |
class UNE_Actor_prev:
|
| 794 |
def __call__(self, state: NState, srt_original_silence_con_ad_ocr_identity, srt_original_silence_con_ad_ocr_identity_une_1):
|
| 795 |
-
print("UNE_Actor_prev.__call__ iniciado")
|
| 796 |
|
| 797 |
with open(srt_original_silence_con_ad_ocr_identity, "r", encoding="utf-8-sig") as f:
|
| 798 |
srt_text = f.read()
|
|
@@ -880,7 +869,6 @@ class UNE_Actor_prev:
|
|
| 880 |
|
| 881 |
class UNE_Actor:
|
| 882 |
def __call__(self, state: NState, srt_original_silence_con_ad_ocr_identity_une_1, srt_original_silence_con_ad_ocr_identity_une_2):
|
| 883 |
-
print("UNE_Actor.__call__ iniciado")
|
| 884 |
|
| 885 |
silence_dict = words_silence_srt(srt_original_silence_con_ad_ocr_identity_une_1)
|
| 886 |
|
|
@@ -922,7 +910,6 @@ class UNE_Actor:
|
|
| 922 |
|
| 923 |
class Valoracion_Final:
|
| 924 |
def __call__(self, state, srt_original_silence_con_ad_ocr_identity_une_2, csv_evaluacion):
|
| 925 |
-
print("Valoracion_Final.__call__ iniciat")
|
| 926 |
|
| 927 |
# Llegeix el contingut del fitxer SRT
|
| 928 |
with open(srt_original_silence_con_ad_ocr_identity_une_2, "r", encoding="utf-8-sig") as f:
|
|
|
|
| 156 |
self.data = data
|
| 157 |
|
| 158 |
def __call__(self, state: NState, srt_original_silence, srt_original_silence_con_ad) -> NState:
|
|
|
|
|
|
|
| 159 |
with open(srt_original_silence, "r", encoding="utf-8") as f:
|
| 160 |
srt_text = f.read()
|
| 161 |
|
|
|
|
| 300 |
|
| 301 |
class Add_Silence_AD:
|
| 302 |
def __call__(self, state: NState, srt_original_silence_con_ad, srt_original_silence_con_ad_silence) -> NState:
|
|
|
|
|
|
|
| 303 |
with open(srt_original_silence_con_ad, "r", encoding="utf-8") as f:
|
| 304 |
srt_text = f.read()
|
| 305 |
|
|
|
|
| 368 |
|
| 369 |
return state
|
| 370 |
|
| 371 |
+
def is_silence(text):
|
| 372 |
+
if "(AD):" in text:
|
| 373 |
+
if "OCR:" in text:
|
| 374 |
return False
|
| 375 |
|
| 376 |
+
elif "[" in text:
|
| 377 |
return False
|
| 378 |
|
| 379 |
else:
|
|
|
|
| 384 |
|
| 385 |
class Unir_AD_Silence:
|
| 386 |
def __call__(self, state: NState, srt_original_silence_con_ad_silence, srt_original_silence_con_ad_silence_unidos) -> NState:
|
|
|
|
|
|
|
| 387 |
with open(srt_original_silence_con_ad_silence, "r", encoding="utf-8") as f:
|
| 388 |
srt_text = f.read()
|
| 389 |
|
|
|
|
| 416 |
while i < len(srt_blocks):
|
| 417 |
actual = srt_blocks[i]
|
| 418 |
|
| 419 |
+
if is_silence(actual["text"]) and "(AD):" in actual["text"]:
|
| 420 |
origenes = [i]
|
| 421 |
start_time = actual["start"]
|
| 422 |
end_time = actual["end"]
|
|
|
|
| 424 |
texto_ocr = ocr_text[i]
|
| 425 |
texto_descripcion = descripcion[i]
|
| 426 |
|
| 427 |
+
while j < len(srt_blocks) and is_silence(srt_blocks[j]["text"]) and "(AD):" in srt_blocks[j]["text"]:
|
| 428 |
end_time = srt_blocks[j]["end"]
|
| 429 |
origenes.append(j)
|
| 430 |
texto_ocr += "" + ocr_text[j]
|
|
|
|
| 473 |
|
| 474 |
class Unir_AD_Silences_a_ADs:
|
| 475 |
def __call__(self, state: NState, srt_original_silence_con_ad_silence_unidos_silence, srt_original_silence_con_ad_silence_unidos_silence_general) -> NState:
|
|
|
|
|
|
|
| 476 |
with open(srt_original_silence_con_ad_silence_unidos_silence, "r", encoding="utf-8") as f:
|
| 477 |
srt_text = f.read()
|
| 478 |
|
|
|
|
| 506 |
|
| 507 |
if "(AD):" in block["text"]:
|
| 508 |
|
| 509 |
+
if is_silence(block["text"]):
|
| 510 |
if i!=0 and ("(AD): OCR:" in srt_blocks[i-1]["text"]):
|
| 511 |
continue
|
| 512 |
|
|
|
|
| 525 |
|
| 526 |
elif "(AD): OCR:" in block["text"]:
|
| 527 |
|
| 528 |
+
if i!=0 and is_silence(srt_blocks[i-1]["text"]):
|
| 529 |
start_time = srt_blocks[i-1]["start"]
|
| 530 |
antes = True
|
| 531 |
|
| 532 |
+
if i!= len(srt_blocks)-1 and is_silence(srt_blocks[i+1]["text"]):
|
| 533 |
end_time = srt_blocks[i+1]["end"]
|
| 534 |
despues = True
|
| 535 |
|
|
|
|
| 619 |
|
| 620 |
class Introduccion_OCR:
|
| 621 |
def __call__(self, state: NState, srt_original_silence_con_ad_silence_unidos_silence_general, srt_original_silence_con_ad_silence_unidos_silence_general_ocr):
|
|
|
|
| 622 |
|
| 623 |
words_silence = words_silence_srt(srt_original_silence_con_ad_silence_unidos_silence_general)
|
| 624 |
|
|
|
|
| 700 |
|
| 701 |
class Identity_Manager:
|
| 702 |
def __call__(self, state: NState, srt_original_silence_con_ad_ocr, srt_original_silence_con_ad_ocr_identity):
|
|
|
|
| 703 |
|
| 704 |
with open(srt_original_silence_con_ad_ocr, "r", encoding="utf-8-sig") as f:
|
| 705 |
srt_text = f.read()
|
|
|
|
| 782 |
|
| 783 |
class UNE_Actor_prev:
|
| 784 |
def __call__(self, state: NState, srt_original_silence_con_ad_ocr_identity, srt_original_silence_con_ad_ocr_identity_une_1):
|
|
|
|
| 785 |
|
| 786 |
with open(srt_original_silence_con_ad_ocr_identity, "r", encoding="utf-8-sig") as f:
|
| 787 |
srt_text = f.read()
|
|
|
|
| 869 |
|
| 870 |
class UNE_Actor:
|
| 871 |
def __call__(self, state: NState, srt_original_silence_con_ad_ocr_identity_une_1, srt_original_silence_con_ad_ocr_identity_une_2):
|
|
|
|
| 872 |
|
| 873 |
silence_dict = words_silence_srt(srt_original_silence_con_ad_ocr_identity_une_1)
|
| 874 |
|
|
|
|
| 910 |
|
| 911 |
class Valoracion_Final:
|
| 912 |
def __call__(self, state, srt_original_silence_con_ad_ocr_identity_une_2, csv_evaluacion):
|
|
|
|
| 913 |
|
| 914 |
# Llegeix el contingut del fitxer SRT
|
| 915 |
with open(srt_original_silence_con_ad_ocr_identity_une_2, "r", encoding="utf-8-sig") as f:
|