File size: 7,388 Bytes
97260a5
 
8017292
 
 
 
 
97260a5
 
 
8017292
 
 
 
97260a5
 
 
 
 
 
 
 
 
 
105bad1
 
 
 
 
3f409fa
 
105bad1
 
 
 
 
 
 
 
 
97260a5
 
 
 
 
8017292
 
97260a5
3f409fa
97260a5
 
 
8017292
 
 
97260a5
 
8017292
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
97260a5
 
8017292
105bad1
8017292
 
 
 
 
 
 
 
 
 
 
 
105bad1
 
97260a5
 
 
105bad1
97260a5
 
 
 
 
105bad1
 
97260a5
 
 
 
 
 
 
 
8017292
97260a5
105bad1
97260a5
8017292
 
 
97260a5
3f409fa
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
97260a5
3f409fa
 
 
 
 
 
97260a5
 
3f409fa
97260a5
 
 
 
 
 
 
 
 
3f409fa
 
 
 
8017292
105bad1
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
97260a5
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
import json
import logging
import datetime
import time
import requests
import pytz
import unittest

import gradio as gr
from utils import process_json_files, flatten_text_with_line_breaks, calculate_tanach_statistics, build_word_index

import logging
from deep_translator import GoogleTranslator
from deep_translator.exceptions import NotValidLength, RequestError

# Set up logging
# Root logger at DEBUG level; every record shows timestamp, level name and message.
logging.basicConfig(level=logging.DEBUG, format='%(asctime)s - %(levelname)s - %(message)s')

# Load Tanach text
# NOTE(review): 1 and 39 are presumably the first and last book numbers to
# load — confirm against utils.process_json_files.
TANACH_DATA = process_json_files(1, 39)
# Lookup table derived from the loaded text. get_current_word_data compares
# its keys numerically against a seconds-since-midnight value.
WORD_INDEX = build_word_index(TANACH_DATA)

# --- Utility Functions ---

def get_current_word_data(client_time_str):
    """Look up the WORD_INDEX entry closest to a time of day.

    Args:
        client_time_str: Time of day formatted as "%H:%M:%S".

    Returns:
        A ``(entry, key)`` tuple where *key* is the WORD_INDEX key numerically
        closest to the number of seconds since midnight and *entry* is the
        value stored under it. ``(None, None)`` is returned when the time
        string cannot be parsed or the index has no usable keys.
    """
    try:
        client_time = datetime.datetime.strptime(client_time_str, "%H:%M:%S")
        total_seconds = (
            client_time.hour * 3600
            + client_time.minute * 60
            + client_time.second
        )

        # Find the closest key in WORD_INDEX (first one wins on a tie).
        word_position = min(WORD_INDEX, key=lambda k: abs(k - total_seconds))
    except (ValueError, TypeError) as e:
        # ValueError: malformed time string or empty index.
        # TypeError: non-string input or non-numeric index keys.
        logging.error("Error processing client time: %s", e)
        return None, None

    return WORD_INDEX[word_position], word_position

def get_formatted_verse(book_id, chapter_id, verse_id, highlight_word=True):
    """Render one chapter as HTML, optionally marking a single line.

    The chapter stored at ``TANACH_DATA[book_id]["text"][chapter_id]`` is
    flattened with ``flatten_text_with_line_breaks`` and its items are joined
    with ``<br>``. When ``highlight_word`` is truthy and ``verse_id - 1`` is a
    valid position in the flattened list, that item is wrapped in a
    ``<span class='highlight'>`` element first.
    """
    lines = flatten_text_with_line_breaks(TANACH_DATA[book_id]["text"][chapter_id])

    if not highlight_word:
        return '<br>'.join(lines)

    # verse_id is 1-based here; out-of-range values leave the text unmarked.
    target = verse_id - 1
    if 0 <= target < len(lines):
        lines[target] = f"<span class='highlight'>{lines[target]}</span>"

    return '<br>'.join(lines)


def _split_on_line_breaks(text, max_length):
    """Split *text* into chunks of at most *max_length* characters.

    Chunks end on newline boundaries whenever possible; only a single line
    longer than *max_length* is cut at a fixed width.
    """
    chunks = []
    pending = []       # lines collected for the chunk currently being built
    pending_len = 0    # length of '\n'.join(pending)

    def flush():
        nonlocal pending, pending_len
        if pending:
            chunks.append('\n'.join(pending))
            pending, pending_len = [], 0

    for line in text.split('\n'):
        # A line that cannot fit in any chunk has to be hard-split.
        while len(line) > max_length:
            flush()
            chunks.append(line[:max_length])
            line = line[max_length:]

        # +1 accounts for the newline that joins this line to the previous one.
        needed = len(line) + (1 if pending else 0)
        if pending_len + needed > max_length:
            flush()
            needed = len(line)
        pending.append(line)
        pending_len += needed

    flush()
    return chunks


def translate_verse(hebrew_verse, highlight_word=True):
    """Translate Hebrew text to English, chunking long input.

    The text is split into chunks of at most 2000 characters, preferring
    newline boundaries so that lines are not cut in the middle. Each chunk is
    translated separately and the results are joined with newlines. No
    translated text is discarded.

    Args:
        hebrew_verse: Newline-separated Hebrew text.
        highlight_word: Accepted for interface compatibility; not used.

    Returns:
        The English translation, an empty string for empty input, or a
        "Translation unavailable: ..." message when the translator reports
        a request or length error.
    """
    max_length = 2000  # Slightly below the limit to be safe

    if not hebrew_verse:
        return ""

    try:
        translator = GoogleTranslator(source='iw', target='en')
        translated_parts = []

        for chunk in _split_on_line_breaks(hebrew_verse, max_length):
            # Blank chunks carry nothing to translate; keep them as-is so the
            # line structure survives.
            if not chunk.strip():
                translated_parts.append(chunk)
                continue
            # Guard against a falsy (e.g. None) result from the translator.
            translated_parts.append(translator.translate(chunk) or "")

        return '\n'.join(translated_parts)

    except RequestError as e:
        logging.warning(f"Translation failed: Request Error - {e}")
        return "Translation unavailable: Request Error"
    except NotValidLength as e:
        logging.warning(f"Translation failed: Invalid Length - {e}")
        return "Translation unavailable: Invalid Length"


# --- Gradio Callback ---

def update_tanach_display(client_time_str, timezone):
    """Build the verse header, Hebrew text and English translation for a time.

    Args:
        client_time_str: Wall-clock time of day formatted as "%H:%M:%S".
        timezone: Timezone name accepted by ``pytz.timezone``.

    Returns:
        A ``(verse_info, hebrew_verse, english_verse)`` tuple of strings. On
        failure the first element is an error message and the other two are
        empty strings.
    """
    try:
        # Reject timezone names pytz does not know.
        pytz.timezone(timezone)

        # Validate the time string and normalise it to zero-padded HH:MM:SS.
        # No offset arithmetic is applied: attaching a tzinfo to a parsed time
        # never changes its hour/minute/second, and deriving an offset from a
        # naive "now" can fail around DST transitions.
        client_time_str = datetime.datetime.strptime(
            client_time_str, "%H:%M:%S"
        ).strftime("%H:%M:%S")
    except Exception as e:
        # UI callback boundary: report any validation failure to the user
        # instead of raising.
        logging.error(f"Error adjusting client time based on timezone: {e}")
        return "Error: Invalid Timezone", "", ""

    word_data, word_position = get_current_word_data(client_time_str)

    if word_data is None:
        logging.error("No word found in index for client time %s.", client_time_str)
        return "Error: Word not found", "", ""

    book_id = word_data["book_id"]
    chapter_id = word_data["chapter_id"]
    verse_id = word_data["verse_id"]

    logging.debug(f"Book ID: {book_id}, Chapter ID: {chapter_id}, Verse ID: {verse_id}")

    # Format verse information (chapter_id is 0-based, shown 1-based)
    verse_info = f"""
    **{TANACH_DATA[book_id]['title']}**
    Chapter {chapter_id + 1}, Verse {verse_id}
    """

    # Get and format Hebrew and English verses
    hebrew_verse = get_formatted_verse(book_id, chapter_id, verse_id)
    # NOTE(review): the highlight <span> markup is part of the text sent for
    # translation — confirm this is intended.
    english_verse = translate_verse(hebrew_verse.replace('<br>', '\n'), highlight_word=False)

    return verse_info, hebrew_verse, english_verse


# --- Gradio Interface ---

# Build the UI. The CSS ids (#verse-info, #verses, #hebrew-verse,
# #english-verse) match the elem_id values given to the components below, and
# .highlight matches the span class emitted by get_formatted_verse.
with gr.Blocks(css="""
 .container {
 display: flex;
 flex-direction: column;
 align-items: center;
 font-family: 'Times New Roman', serif;
 }
 /* Add this highlight class styling */
 .highlight {
 background-color: #FFFF00; /* Yellow highlight */
 padding: 2px 5px;
 border-radius: 5px;
 }
 #verse-info {
 margin-bottom: 20px;
 text-align: center;
 }
 #verses {
 display: flex;
 flex-direction: row;
 justify-content: center;
 align-items: flex-start;
 gap: 50px;
 }
 #hebrew-verse {
 font-size: 18px;
 line-height: 1.5;
 margin-bottom: 20px;
 text-align: right;
 direction: rtl;
 }
 #english-verse {
 font-size: 18px;
 line-height: 1.5;
 margin-bottom: 20px;
 }
""") as iface:
    # Timezone selector, populated from pytz's common timezone names.
    with gr.Row():
        timezone_input = gr.Dropdown(
          choices=[tz for tz in pytz.common_timezones],
          label="Select Your Timezone",
          value="UTC"  # Set a default timezone
        )

    # Button that triggers a refresh of the three outputs below.
    with gr.Row():
        advance_button = gr.Button("Advance to Current Time")

    # Markdown header showing the book title, chapter and verse.
    with gr.Row():
        verse_info_output = gr.Markdown(label="Verse Information", elem_id="verse-info")

    # Place Hebrew and English verses within a flex container
    with gr.Row(elem_id="verses"):
        hebrew_verse_output = gr.HTML(label="Hebrew Verse", elem_id="hebrew-verse")
        english_verse_output = gr.HTML(label="English Translation", elem_id="english-verse")

    # Update the display with verse information and translations when the button is clicked
    # The time passed on is "now" in the selected timezone, formatted HH:MM:SS,
    # taken from the clock of the process running this script.
    advance_button.click(
        fn=lambda tz: update_tanach_display(datetime.datetime.now(pytz.timezone(tz)).strftime("%H:%M:%S"), tz),
        inputs=[timezone_input],
        outputs=[verse_info_output, hebrew_verse_output, english_verse_output],
    )

class TestWordIndex(unittest.TestCase):
    """Checks which index entries the first and last second of the day map to."""

    def test_word_index_boundaries(self):
        # Each case pairs a time of day with the fields expected in the entry
        # returned by get_current_word_data, checked in the listed order.
        boundary_cases = (
            # Test for 0:00:00
            ("00:00:00", (("book_id", 1), ("chapter_id", 0), ("verse_id", 1))),
            # Test for 23:59:59
            ("23:59:59", (("book_id", 39), ("chapter_id", 35), ("verse_id", 23))),
        )

        for clock_text, expected_fields in boundary_cases:
            entry, _ = get_current_word_data(clock_text)
            for field_name, expected_value in expected_fields:
                self.assertEqual(entry[field_name], expected_value)

if __name__ == '__main__':
    # Run the index boundary checks first. The runner's result is not
    # inspected, so a failing check does not prevent the launch.
    loader = unittest.TestLoader()
    runner = unittest.TextTestRunner()
    runner.run(loader.loadTestsFromTestCase(TestWordIndex))

    # Start the Gradio app with sharing enabled.
    iface.launch(share=True)