Spaces:

OrganizedProgrammers
/

ETSIDocFinder

Sleeping

App Files Files Community

om4r932 committed 4 days ago

Commit

2cdd1ea

1 Parent(s): 9f149f3

Removed comments + add specifications + add batch search

Browse files

Files changed (3) hide show

app.py +98 -287
static/script.js +96 -96
templates/index.html +6 -6

app.py CHANGED Viewed

@@ -41,135 +41,29 @@ app.add_middleware(
     allow_headers=["*"],
 )
-# def get_text(specification: str, version: str):
-#     """Récupère les bytes du PDF à partir d'une spécification et d'une version."""
-#     doc_id = specification
-#     series = doc_id.split(".")[0]
-#     response = requests.get(
-#         f"https://www.3gpp.org/ftp/Specs/archive/{series}_series/{doc_id}/{doc_id.replace('.', '')}-{version}.zip",
-#         verify=False,
-#         headers={"User-Agent": 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/91.0.4472.124 Safari/537.36'}
-#     )
-#     if response.status_code != 200:
-#         raise Exception(f"Téléchargement du ZIP échoué pour {specification}-{version}")
-#     zip_bytes = io.BytesIO(response.content)
-#     with zipfile.ZipFile(zip_bytes) as zf:
-#         for file_name in zf.namelist():
-#             if file_name.endswith("zip"):
-#                 print("Another ZIP !")
-#                 zip_bytes = io.BytesIO(zf.read(file_name))
-#                 zf = zipfile.ZipFile(zip_bytes)
-#                 for file_name2 in zf.namelist():
-#                     if file_name2.endswith("doc") or file_name2.endswith("docx"):
-#                         if "cover" in file_name2.lower():
-#                             print("COVER !")
-#                             continue
-#                         ext = file_name2.split(".")[-1]
-#                         doc_bytes = zf.read(file_name2)
-#                         temp_id = str(uuid.uuid4())
-#                         input_path = f"/tmp/{temp_id}.{ext}"
-#                         output_path = f"/tmp/{temp_id}.txt"
-#                         with open(input_path, "wb") as f:
-#                             f.write(doc_bytes)
-#                         subprocess.run([
-#                             "libreoffice",
-#                             "--headless",
-#                             "--convert-to", "txt",
-#                             "--outdir", "/tmp",
-#                             input_path
-#                         ], check=True)
-#                         with open(output_path, "r") as f:
-#                             txt_data = [line.strip() for line in f if line.strip()]
-#                         os.remove(input_path)
-#                         os.remove(output_path)
-#                         return txt_data
-#             elif file_name.endswith("doc") or file_name.endswith("docx"):
-#                 if "cover" in file_name.lower():
-#                     print("COVER !")
-#                     continue
-#                 ext = file_name.split(".")[-1]
-#                 doc_bytes = zf.read(file_name)
-#                 temp_id = str(uuid.uuid4())
-#                 input_path = f"/tmp/{temp_id}.{ext}"
-#                 output_path = f"/tmp/{temp_id}.txt"
-#                 print("Ecriture")
-#                 with open(input_path, "wb") as f:
-#                     f.write(doc_bytes)
-#                 print("Convertissement")
-#                 subprocess.run([
-#                     "libreoffice",
-#                     "--headless",
-#                     "--convert-to", "txt",
-#                     "--outdir", "/tmp",
-#                     input_path
-#                 ], check=True)
-#                 print("Ecriture TXT")
-#                 with open(output_path, "r", encoding="utf-8") as f:
-#                     txt_data = [line.strip() for line in f if line.strip()]
-#                 os.remove(input_path)
-#                 os.remove(output_path)
-#                 return txt_data
-#     raise Exception(f"Aucun fichier .doc/.docx trouvé dans le ZIP pour {specification}-{version}")
-# def get_scope(specification: str, version: str):
-#     try:
-#         spec_text = get_text(specification, version)
-#         scp_i = 0
-#         nxt_i = 0
-#         for x in range(len(spec_text)):
-#             text = spec_text[x]
-#             if re.search(r"scope$", text, flags=re.IGNORECASE):
-#                 scp_i = x
-#                 nxt_i = scp_i + 10
-#             if re.search(r"references$", text, flags=re.IGNORECASE):
-#                 nxt_i = x
-#         return re.sub(r"\s+", " ", " ".join(spec_text[scp_i+1:nxt_i])) if len(spec_text[scp_i+1:nxt_i]) < 2 else "Not found"
-#     except Exception as e:
-#         traceback.print_exception(e)
-#         return "Not found (error)"
 class DocRequest(BaseModel):
     doc_id: str
 class DocResponse(BaseModel):
     doc_id: str
     url: str
     scope: Optional[str] = None
     search_time: float
-# class BatchDocRequest(BaseModel):
-#     doc_ids: List[str]
-#     release: Optional[int] = None
-# class BatchDocResponse(BaseModel):
-#     results: Dict[str, str]
-#     missing: List[str]
-#     search_time: float
-# class KeywordRequest(BaseModel):
-#     keywords: str
-#     release: Optional[str] = None
-#     wg: Optional[str] = None
-#     spec_type: Optional[Literal["TS", "TR"]] = None
-#     mode: Optional[Literal["and", "or"]] = "and"
-# class KeywordResponse(BaseModel):
-#     results: List[Dict[str, str]]
-#     search_time: float
 class DocFinder:
     def __init__(self):
@@ -230,179 +124,96 @@ class DocFinder:
                 return self.indexer[doc]
         main_tsg, workgroup, doc = self.get_workgroup(doc_id)
         if main_tsg:
             wg_url = self.find_workgroup_url(main_tsg, workgroup)
             if wg_url:
                 files = self.get_docs_from_url(wg_url)
                 for f in files:
                     if doc in f.lower() or original in f:
                         doc_url = f"{wg_url}/{f}"
                         self.indexer[original] = doc_url
                         self.save_indexer()
-                        return doc_url
-        return f"Document {doc_id} not found"
-# class DocFinder:
-#     def __init__(self):
-#         self.main_ftp_url = "https://www.3gpp.org/ftp"
-#         self.indexer_file = "indexed_docs.json"
-#         self.indexer, self.last_indexer_date = self.load_indexer()
-#     def load_indexer(self):
-#         """Load existing index if available"""
-#         if os.path.exists(self.indexer_file):
-#             with open(self.indexer_file, "r", encoding="utf-8") as f:
-#                 x = json.load(f)
-#                 return x["docs"], x["last_indexed_date"]
-#         return {}, None
-#     def save_indexer(self):
-#         """Save the updated index"""
-#         self.last_indexer_date = today.strftime("%d/%m/%Y-%H:%M:%S")
-#         with open(self.indexer_file, "w", encoding="utf-8") as f:
-#             today = datetime.today()
-#             output = {"docs": self.indexer, "last_indexed_date": self.last_indexer_date}
-#             json.dump(output, f, indent=4, ensure_ascii=False)
-#     def get_workgroup(self, doc):
-#         main_tsg = "tsg_ct" if doc[0] == "C" else "tsg_sa" if doc[0] == "S" else None
-#         if main_tsg is None:
-#             return None, None, None
-#         workgroup = f"WG{int(doc[1])}" if doc[1].isnumeric() else main_tsg.upper()
-#         return main_tsg, workgroup, doc
-#     def find_workgroup_url(self, main_tsg, workgroup):
-#         """Find the URL for the specific workgroup"""
-#         response = requests.get(f"{self.main_ftp_url}/{main_tsg}", verify=False)
-#         soup = BeautifulSoup(response.text, 'html.parser')
-#         for item in soup.find_all("tr"):
-#             link = item.find("a")
-#             if link and workgroup in link.get_text():
-#                 return f"{self.main_ftp_url}/{main_tsg}/{link.get_text()}"
-#         return f"{self.main_ftp_url}/{main_tsg}/{workgroup}"
-#     def get_docs_from_url(self, url):
-#         """Get list of documents/directories from a URL"""
-#         try:
-#             response = requests.get(url, verify=False, timeout=10)
-#             soup = BeautifulSoup(response.text, "html.parser")
-#             return [item.get_text() for item in soup.select("tr td a")]
-#         except Exception as e:
-#             print(f"Error accessing {url}: {e}")
-#             return []
-#     def search_document(self, doc_id: str, release=None):
-#         original_id = doc_id
-#         if original_id in self.indexer:
-#             return self.indexer[original_id]
-#         for doc in self.indexer:
-#             if doc.startswith(original_id):
-#                 return self.indexer[doc]
-#         # 2. Recherche live "classique" (TSG/CT)
-#         main_tsg, workgroup, doc = self.get_workgroup(doc_id)
-#         if main_tsg:
-#             wg_url = self.find_workgroup_url(main_tsg, workgroup)
-#             if wg_url:
-#                 meeting_folders = self.get_docs_from_url(wg_url)
-#                 for folder in meeting_folders:
-#                     meeting_url = f"{wg_url}/{folder}"
-#                     meeting_contents = self.get_docs_from_url(meeting_url)
-#                     key = "docs" if "docs" in [x.lower() for x in meeting_contents] else "tdocs" if "tdocs" in [x.lower() for x in meeting_contents] else None
-#                     if key is not None:
-#                         docs_url = f"{meeting_url}/{key}"
-#                         files = self.get_docs_from_url(docs_url)
-#                         for file in files:
-#                             if doc in file.lower() or original_id in file:
-#                                 doc_url = f"{docs_url}/{file}"
-#                                 self.indexer[original_id] = doc_url
-#                                 return doc_url
-#                         # ZIP subfolder
-#                         if "zip" in [x for x in files]:
-#                             zip_url = f"{docs_url}/zip"
-#                             zip_files = self.get_docs_from_url(zip_url)
-#                             for file in zip_files:
-#                                 if doc in file.lower() or original_id in file:
-#                                     doc_url = f"{zip_url}/{file}"
-#                                     self.indexer[original_id] = doc_url
-#                                     self.save_indexer()
-#                                     return doc_url
-#         # 3. Dernier recours : tenter dans /ftp/workshop (recherche live)
-#         workshop_url = f"{self.main_ftp_url}/workshop"
-#         meetings = self.get_docs_from_url(workshop_url)
-#         for meeting in meetings:
-#             if meeting in ['./', '../']:
-#                 continue
-#             meeting_url = f"{workshop_url}/{meeting}"
-#             contents = self.get_docs_from_url(meeting_url)
-#             for sub in contents:
-#                 if sub.lower() in ['docs', 'tdocs']:
-#                     docs_url = f"{meeting_url}/{sub}"
-#                     files = self.get_docs_from_url(docs_url)
-#                     for file in files:
-#                         if doc_id.lower() in file.lower() or original_id in file:
-#                             doc_url = f"{docs_url}/{file}"
-#                             self.indexer[original_id] = doc_url
-#                             self.save_indexer()
-#                             return doc_url
-#                     if "zip" in [x.lower() for x in files]:
-#                         zip_url = f"{docs_url}/zip"
-#                         zip_files = self.get_docs_from_url(zip_url)
-#                         for file in zip_files:
-#                             if doc_id.lower() in file.lower() or original_id in file:
-#                                 doc_url = f"{zip_url}/{file}"
-#                                 self.indexer[original_id] = doc_url
-#                                 self.save_indexer()
-#                                 return doc_url
-#         return f"Document {doc_id} not found"
 @app.get("/")
 async def main_menu():
     return FileResponse(os.path.join("templates", "index.html"))
-# @app.post("/search-spec", response_model=KeywordResponse)
-# def search_spec(request: KeywordRequest):
-#     start_time = time.time()
-#     kws = [_.lower() for _ in request.keywords.split(" ")]
-#     results = []
-#     for string, spec in finder_spec.indexer_specs.items():
-#         if request.mode == "and":
-#             if not all(kw in string.lower() for kw in kws):
-#                 continue
-#         elif request.mode == "or":
-#             if not any(kw in string.lower() for kw in kws):
-#                 continue
-#         release = request.release
-#         working_group = request.wg
-#         spec_type = request.spec_type
-#         if spec.get('version', None) is None or (release is not None and spec["version"].split(".")[0] != str(release)):
-#             continue
-#         if spec.get('working_group', None) is None or (working_group is not None and spec["working_group"] != working_group):
-#             continue
-#         if spec_type is not None and spec["type"] != spec_type:
-#             continue
-#         results.append(spec)
-#     if len(results) > 0:
-#         return KeywordResponse(
-#             results=results,
-#             search_time=time.time() - start_time
-#         )
-#     else:
-#         raise HTTPException(status_code=404, detail="Specifications not found")
-finder = DocFinder()
-@app.post("/find", response_model=DocResponse)
 def find_document(request: DocRequest):
     start_time = time.time()
     result = finder.search_document(request.doc_id)
     if "not found" not in result and "Could not" not in result and "Unable" not in result:
@@ -410,27 +221,27 @@ def find_document(request: DocRequest):
             doc_id=request.doc_id,
             url=result,
             search_time=time.time() - start_time
-        )
     else:
         raise HTTPException(status_code=404, detail=result)
-# @app.post("/batch", response_model=BatchDocResponse)
-# def find_documents_batch(request: BatchDocRequest):
-#     start_time = time.time()
-#     results = {}
-#     missing = []
-#     for doc_id in request.doc_ids:
-#         finder = finder_tsg if doc_id[0].isalpha() else finder_spec
-#         result = finder.search_document(doc_id)
-#         if "not found" not in result and "Could not" not in result and "Unable" not in result:
-#             results[doc_id] = result
-#         else:
-#             missing.append(doc_id)
-#     return BatchDocResponse(
-#         results=results,
-#         missing=missing,
-#         search_time=time.time() - start_time
-#     )

     allow_headers=["*"],
 )
 class DocRequest(BaseModel):
     doc_id: str
 class DocResponse(BaseModel):
     doc_id: str
     url: str
+    release: Optional[str] = None
     scope: Optional[str] = None
     search_time: float
+class MultiDocResponse(BaseModel):
+    """Response shape that bundles several DocResponse entries under one doc_id."""
+    # NOTE(review): no endpoint visible in this diff returns this model - confirm it is used.
+    doc_id: str
+    results: List[DocResponse]
+    search_time: float
+class BatchDocRequest(BaseModel):
+    """Request body for POST /batch: the list of document/specification IDs to look up."""
+    doc_ids: List[str]
+    # NOTE(review): `release` is accepted but the /batch handler shown in this diff never reads it.
+    release: Optional[int] = None
+class BatchDocResponse(BaseModel):
+    """Response body for POST /batch."""
+    # Maps each requested ID that was found to the string returned by the finder (a URL).
+    results: Dict[str, str]
+    # Requested IDs for which the finder returned a "not found"-style message.
+    missing: List[str]
+    # Elapsed wall-clock time for the whole batch, in seconds (difference of time.time() values).
+    search_time: float
 class DocFinder:
     def __init__(self):
                 return self.indexer[doc]
         main_tsg, workgroup, doc = self.get_workgroup(doc_id)
+        urls = []
         if main_tsg:
             wg_url = self.find_workgroup_url(main_tsg, workgroup)
             if wg_url:
                 files = self.get_docs_from_url(wg_url)
                 for f in files:
                     if doc in f.lower() or original in f:
+                        print(f)
                         doc_url = f"{wg_url}/{f}"
                         self.indexer[original] = doc_url
                         self.save_indexer()
+                        urls.append(doc_url)
+        return urls[0] if len(urls) == 1 else urls[-2] if len(urls) > 1 else f"Document {doc_id} not found"
+class SpecFinder:
+    """Resolve ETSI TS specification IDs (e.g. "103 666-2") to a PDF URL.
+    Lookups are served from the JSON index loaded from ``indexer_file`` when
+    possible; otherwise the directory listings under ``main_url`` are scraped.
+    """
+    def __init__(self):
+        self.main_url = "https://www.etsi.org/deliver/etsi_ts"
+        self.indexer_file = "indexed_specifications.json"
+        self.indexer, self.last_indexer_date = self.load_indexer()
+        self.headers = {"User-Agent": "Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/136.0.0.0 Safari/537.36"}
+    def load_indexer(self):
+        """Return ``(specs, last_indexed_date)`` from the index file, or ``({}, None)`` when it does not exist."""
+        if not os.path.exists(self.indexer_file):
+            return {}, None
+        with open(self.indexer_file, "r", encoding="utf-8") as f:
+            x = json.load(f)
+        return x["specs"], x["last_indexed_date"]
+    def save_indexer(self):
+        """Write the in-memory index back to ``indexer_file`` and refresh ``last_indexer_date``."""
+        today = datetime.today()
+        self.last_indexer_date = today.strftime("%d/%m/%Y-%H:%M:%S")
+        with open(self.indexer_file, "w", encoding="utf-8") as f:
+            output = {"specs": self.indexer, "last_indexed_date": self.last_indexer_date}
+            json.dump(output, f, indent=4, ensure_ascii=False)
+    def get_spec_path(self, doc_id: str):
+        """Build the ``<range>/<folder>`` path fragment for a specification ID.
+        ``"103 666-2"`` becomes ``"103600_103699/10366602"``: the number with spaces
+        removed selects a bucket of 100 specs, and each dash-separated part is
+        zero-padded to two digits and appended to the folder name.
+        Raises ValueError when the numeric portion is not an integer.
+        """
+        # Split on every dash: the previous two-value unpacking raised ValueError
+        # for IDs with more than one part ("300 392-3-1").
+        # Assumes the server appends each sub-part the same way - TODO confirm.
+        position, *parts = doc_id.split("-")
+        position = position.replace(" ", "")
+        suffix = "".join(p.strip().zfill(2) for p in parts if p.strip())
+        number = int(position)
+        base = number - number % 100
+        return f"{base}_{base + 99}/{position}{suffix}"
+    def get_docs_from_url(self, url):
+        """Return the link texts found at ``url`` (first link skipped), or ``[]`` on any error."""
+        try:
+            # Send the User-Agent prepared in __init__; it was defined but never used.
+            # NOTE(review): verify=False disables TLS certificate checks - kept as-is, confirm it is required.
+            response = requests.get(url, headers=self.headers, verify=False, timeout=15)
+            # Treat HTTP errors as "nothing found" instead of parsing links out of an error page.
+            response.raise_for_status()
+            soup = BeautifulSoup(response.text, "html.parser")
+            # The first anchor is dropped - presumably the parent-directory link of the listing.
+            return [item.get_text() for item in soup.find_all("a")][1:]
+        except Exception as e:
+            print(f"Error accessing {url}: {e}")
+            return []
+    def search_document(self, doc_id: str):
+        """Return the PDF URL for ``doc_id`` or the string ``"Specification <id> not found"``.
+        Accepted form: ``103 666`` optionally followed by ``-<part>`` (e.g. ``103 666-2``).
+        """
+        original = doc_id
+        if original in self.indexer:
+            return self.indexer[original]
+        for doc in self.indexer:
+            if doc.startswith(original):
+                return self.indexer[doc]
+        not_found = f"Specification {doc_id} not found"
+        try:
+            url = f"{self.main_url}/{self.get_spec_path(original)}/"
+        except ValueError:
+            # Malformed ID (non-numeric spec number): report it as not found rather than crash.
+            return not_found
+        releases = self.get_docs_from_url(url)
+        if not releases:
+            # Unknown spec or unreachable server; releases[-1] used to raise IndexError here.
+            return not_found
+        # Assumes the listing is ordered so that the last entry is the newest release - TODO confirm.
+        latest = releases[-1]
+        for f in self.get_docs_from_url(url + latest):
+            if f.endswith(".pdf"):
+                return url + latest + "/" + f
+        return not_found
 @app.get("/")
 async def main_menu():
     return FileResponse(os.path.join("templates", "index.html"))
+finder_doc = DocFinder()
+finder_spec = SpecFinder()
+@app.post("/find")
 def find_document(request: DocRequest):
     start_time = time.time()
+    finder = finder_spec if request.doc_id[0].isnumeric() else finder_doc
     result = finder.search_document(request.doc_id)
     if "not found" not in result and "Could not" not in result and "Unable" not in result:
             doc_id=request.doc_id,
             url=result,
             search_time=time.time() - start_time
+        ) if not isinstance(result, list) else result
     else:
         raise HTTPException(status_code=404, detail=result)
+@app.post("/batch", response_model=BatchDocResponse)
+def find_documents_batch(request: BatchDocRequest):
+    """Look up every ID in ``request.doc_ids`` and split them into found and missing.
+    IDs starting with a digit go to ``finder_spec``; all others go to ``finder_doc``
+    (the same rule the /find endpoint uses). ``request.release`` is not consulted.
+    Returns a BatchDocResponse with ``results`` (ID -> URL), ``missing`` (IDs not
+    found) and ``search_time`` in seconds.
+    """
+    start_time = time.time()
+    results = {}
+    missing = []
+    for doc_id in request.doc_ids:
+        lookup_id = doc_id.strip()
+        if not lookup_id:
+            # Blank entries used to raise IndexError on doc_id[0]; report them as missing.
+            missing.append(doc_id)
+            continue
+        finder = finder_spec if lookup_id[0].isnumeric() else finder_doc
+        try:
+            result = finder.search_document(lookup_id)
+        except (ValueError, IndexError):
+            # One malformed ID must not abort the whole batch.
+            missing.append(doc_id)
+            continue
+        if "not found" not in result and "Could not" not in result and "Unable" not in result:
+            results[doc_id] = result
+        else:
+            missing.append(doc_id)
+    return BatchDocResponse(
+        results=results,
+        missing=missing,
+        search_time=time.time() - start_time
+    )

static/script.js CHANGED Viewed

@@ -2,21 +2,21 @@
 const dynamicDesc = document.getElementById("dynamicDesc");
 const dynamicTitle = document.getElementById("dynamicTitle");
-// const singleModeBtn = document.getElementById('single-mode-btn');
-// const batchModeBtn = document.getElementById('batch-mode-btn');
 // const keywordModeBtn = document.getElementById("keyword-mode-btn");
 const singleInput = document.querySelector('.single-input');
-// const batchInput = document.querySelector('.batch-input');
 // const keywordSearchInput = document.querySelector(".keyword-input");
 const docIdInput = document.getElementById('doc-id');
-// const batchIdsInput = document.getElementById('batch-ids');
 // const keywordInput = document.getElementById("keywords");
 const searchBtn = document.getElementById('search-btn');
 const batchSearchBtn = document.getElementById('batch-search-btn');
-const keywordSearchBtn = document.getElementById("keyword-search-btn");
 const loader = document.getElementById('loader');
 const resultsContainer = document.getElementById('results-container');
@@ -25,31 +25,31 @@ const resultsStats = document.getElementById('results-stats');
 const errorMessage = document.getElementById('error-message');
 // Search mode toggle
-// singleModeBtn.addEventListener('click', () => {
-//     dynamicTitle.textContent = "Find 3GPP Documents";
-//     dynamicDesc.textContent = "Enter a TSG document ID / specification ID (e.g., S1-123456, C2-987654 or 31.102) to locate the document in the 3GPP FTP server.";
-//     singleModeBtn.classList.add('active');
-//     keywordModeBtn.classList.remove("active");
-//     batchModeBtn.classList.remove('active');
-//     singleInput.style.display = 'block';
-//     batchInput.style.display = 'none';
-//     keywordSearchInput.style.display = "none";
-// });
-// batchModeBtn.addEventListener('click', () => {
-//     dynamicTitle.textContent = "Find multiple 3GPP Documents";
-//     dynamicDesc.textContent = "Enter a list of TSG document ID / specification ID (e.g., S1-123456, C2-987654 or 31.102) to locate all of the specified documents in the 3GPP FTP server.";
-//     batchModeBtn.classList.add('active');
-//     keywordModeBtn.classList.remove("active");
-//     singleModeBtn.classList.remove('active');
-//     batchInput.style.display = 'block';
-//     keywordSearchInput.style.display = "none";
-//     singleInput.style.display = 'none';
-// });
 // keywordModeBtn.addEventListener('click', () => {
 //     dynamicTitle.textContent = "Search 3GPP specifications";
@@ -134,48 +134,48 @@ searchBtn.addEventListener('click', async () => {
 });
 // Batch document search
-// batchSearchBtn.addEventListener('click', async () => {
-//     const batchText = batchIdsInput.value.trim();
-//     if (!batchText) {
-//         showError('Please enter at least one document ID');
-//         return;
-//     }
-//     const docIds = batchText.split('\n')
-//         .map(id => id.trim())
-//         .filter(id => id !== '');
-//     if (docIds.length === 0) {
-//         showError('Please enter at least one valid document ID');
-//         return;
-//     }
-//     showLoader();
-//     hideError();
-//     try {
-//         const response = await fetch(`/batch`, {
-//             method: 'POST',
-//             headers: {
-//                 'Content-Type': 'application/json'
-//             },
-//             body: JSON.stringify({ doc_ids: docIds })
-//         });
-//         const data = await response.json();
-//         if (response.ok) {
-//             displayBatchResults(data);
-//         } else {
-//             showError('Error processing batch request');
-//         }
-//     } catch (error) {
-//         showError('Error connecting to the server. Please check if the API is running.');
-//         console.error('Error:', error);
-//     } finally {
-//         hideLoader();
-//     }
-// });
 // Display single result
 function displaySingleResult(data) {
@@ -246,45 +246,45 @@ function displaySingleNotFound(docId, message) {
 //     resultsContainer.style.display = 'block';
 // }
-// // Display batch results
-// function displayBatchResults(data) {
-//     resultsList.innerHTML = '';
-//     // Found documents
-//     Object.entries(data.results).forEach(([docId, url]) => {
-//         const resultItem = document.createElement('div');
-//         resultItem.className = 'result-item';
-//         resultItem.innerHTML = `
-//             <div class="result-header">
-//                 <div class="result-id">${docId}</div>
-//                 <div class="result-status status-found">Found</div>
-//             </div>
-//             <div class="result-url">
-//                 <a href="${url}" target="_blank">${url}</a>
-//             </div>
-//         `;
-//         resultsList.appendChild(resultItem);
-//     });
-//     // Not found documents
-//     data.missing.forEach(docId => {
-//         const resultItem = document.createElement('div');
-//         resultItem.className = 'result-item';
-//         resultItem.innerHTML = `
-//             <div class="result-header">
-//                 <div class="result-id">${docId}</div>
-//                 <div class="result-status status-not-found">Not Found</div>
-//             </div>
-//         `;
-//         resultsList.appendChild(resultItem);
-//     });
-//     const foundCount = Object.keys(data.results).length;
-//     const totalCount = foundCount + data.missing.length;
-//     resultsStats.textContent = `Found ${foundCount} of ${totalCount} documents in ${data.search_time.toFixed(2)} seconds`;
-//     resultsContainer.style.display = 'block';
-// }
 // Show loader
 function showLoader() {

 const dynamicDesc = document.getElementById("dynamicDesc");
 const dynamicTitle = document.getElementById("dynamicTitle");
+const singleModeBtn = document.getElementById('single-mode-btn');
+const batchModeBtn = document.getElementById('batch-mode-btn');
 // const keywordModeBtn = document.getElementById("keyword-mode-btn");
 const singleInput = document.querySelector('.single-input');
+const batchInput = document.querySelector('.batch-input');
 // const keywordSearchInput = document.querySelector(".keyword-input");
 const docIdInput = document.getElementById('doc-id');
+const batchIdsInput = document.getElementById('batch-ids');
 // const keywordInput = document.getElementById("keywords");
 const searchBtn = document.getElementById('search-btn');
 const batchSearchBtn = document.getElementById('batch-search-btn');
+// const keywordSearchBtn = document.getElementById("keyword-search-btn");
 const loader = document.getElementById('loader');
 const resultsContainer = document.getElementById('results-container');
 const errorMessage = document.getElementById('error-message');
 // Search mode toggle
+// Switch the UI to single-document mode: update the heading and description,
+// mark this button active, and show only the single-ID input.
+singleModeBtn.addEventListener('click', () => {
+    dynamicTitle.textContent = "Find ETSI Documents";
+    dynamicDesc.textContent = "Enter a SET/SCP/TS document ID to locate the document in the ETSI DocBox server.";
+    singleModeBtn.classList.add('active');
+    // keywordModeBtn.classList.remove("active");
+    batchModeBtn.classList.remove('active');
+    singleInput.style.display = 'block';
+    batchInput.style.display = 'none';
+    // keywordSearchInput.style.display = "none";
+});
+// Switch the UI to batch mode: update the heading and description,
+// mark this button active, and show only the multi-line ID input.
+batchModeBtn.addEventListener('click', () => {
+    dynamicTitle.textContent = "Find multiple ETSI Documents";
+    dynamicDesc.textContent = "Enter a list of SET/SCP/TS document ID to locate all specified documents in the ETSI DocBox server.";
+    batchModeBtn.classList.add('active');
+    //keywordModeBtn.classList.remove("active");
+    singleModeBtn.classList.remove('active');
+    batchInput.style.display = 'block';
+    //keywordSearchInput.style.display = "none";
+    singleInput.style.display = 'none';
+});
 // keywordModeBtn.addEventListener('click', () => {
 //     dynamicTitle.textContent = "Search 3GPP specifications";
 });
 // Batch document search
+// Read one ID per line from the batch textarea, POST them to /batch and render the outcome.
+batchSearchBtn.addEventListener('click', async () => {
+    const batchText = batchIdsInput.value.trim();
+    if (!batchText) {
+        showError('Please enter at least one document ID');
+        return;
+    }
+    // trim() also removes the "\r" left behind by Windows line endings.
+    const docIds = batchText.split('\n')
+        .map(id => id.trim())
+        .filter(id => id !== '');
+    if (docIds.length === 0) {
+        showError('Please enter at least one valid document ID');
+        return;
+    }
+    showLoader();
+    hideError();
+    try {
+        const response = await fetch(`/batch`, {
+            method: 'POST',
+            headers: {
+                'Content-Type': 'application/json'
+            },
+            body: JSON.stringify({ doc_ids: docIds })
+        });
+        // Check the status before parsing: an error response may not be JSON, and parsing
+        // it first turned server errors into a misleading "Error connecting" message.
+        if (!response.ok) {
+            showError('Error processing batch request');
+            return;
+        }
+        displayBatchResults(await response.json());
+    } catch (error) {
+        showError('Error connecting to the server. Please check if the API is running.');
+        console.error('Error:', error);
+    } finally {
+        // Runs on every path, including the early return above.
+        hideLoader();
+    }
+});
 // Display single result
 function displaySingleResult(data) {
 //     resultsContainer.style.display = 'block';
 // }
+// Display batch results
+/**
+ * Render the /batch response: one "Found" card with a link per entry of
+ * data.results, one "Not Found" card per entry of data.missing, then the summary line.
+ * Cards are built with DOM APIs and textContent, never innerHTML, because the IDs
+ * are typed by the user and would otherwise be interpreted as markup.
+ * @param {{results: Object<string, string>, missing: string[], search_time: number}} data
+ */
+function displayBatchResults(data) {
+    resultsList.innerHTML = '';
+    // Build the card shell shared by found and missing entries.
+    const buildItem = (docId, statusClass, statusText) => {
+        const item = document.createElement('div');
+        item.className = 'result-item';
+        const header = document.createElement('div');
+        header.className = 'result-header';
+        const idEl = document.createElement('div');
+        idEl.className = 'result-id';
+        idEl.textContent = docId;
+        const statusEl = document.createElement('div');
+        statusEl.className = `result-status ${statusClass}`;
+        statusEl.textContent = statusText;
+        header.appendChild(idEl);
+        header.appendChild(statusEl);
+        item.appendChild(header);
+        return item;
+    };
+    // Found documents
+    Object.entries(data.results).forEach(([docId, url]) => {
+        const resultItem = buildItem(docId, 'status-found', 'Found');
+        const urlBox = document.createElement('div');
+        urlBox.className = 'result-url';
+        const link = document.createElement('a');
+        link.href = url;
+        link.target = '_blank';
+        // Keep the opened page from reaching back into this one through window.opener.
+        link.rel = 'noopener noreferrer';
+        link.textContent = url;
+        urlBox.appendChild(link);
+        resultItem.appendChild(urlBox);
+        resultsList.appendChild(resultItem);
+    });
+    // Not found documents
+    data.missing.forEach(docId => {
+        resultsList.appendChild(buildItem(docId, 'status-not-found', 'Not Found'));
+    });
+    const foundCount = Object.keys(data.results).length;
+    const totalCount = foundCount + data.missing.length;
+    resultsStats.textContent = `Found ${foundCount} of ${totalCount} documents in ${data.search_time.toFixed(2)} seconds`;
+    resultsContainer.style.display = 'block';
+}
 // Show loader
 function showLoader() {

templates/index.html CHANGED Viewed

@@ -20,31 +20,31 @@
         <div class="search-container">
             <div class="search-header">
                 <h2 id="dynamicTitle">Find ETSI Documents</h2>
-                <p id="dynamicDesc">Enter a SET/SCP document IDto locate the document in the ETSI DocBox server.</p>
             </div>
             <div class="search-mode">
                 <button id="single-mode-btn" class="active">Single Document</button>
-                <!-- <button id="batch-mode-btn">Batch Search</button>
-                <button id="keyword-mode-btn">Keyword Search</button> -->
             </div>
             <div class="search-form">
                 <div class="input-group single-input">
                     <label for="doc-id">Document ID</label>
                     <div class="input-field">
-                        <input type="text" id="doc-id" placeholder="Enter SET/SCP document ID (e.g. SETREQ(15)0015451r1, SCP(12)15151, SCPTEC(11)44754r3)">
                         <button id="search-btn" class="btn">Search</button>
                     </div>
                 </div>
-                <!-- <div class="input-group batch-input">
                     <label for="batch-ids">Document IDs or Specification IDs (one per line)</label>
                     <textarea id="batch-ids" placeholder="Enter document IDs or specification IDs, one per line (e.g., S1-123456, C2-987654, 31.102)"></textarea>
                     <div class="hint">Enter one document ID per line</div>
                     <button id="batch-search-btn" class="btn" style="margin-top: 10px;">Search All</button>
                 </div>
                 <div class="input-group keyword-input">
                     <label for="keywords">Keywords</label>
                     <div class="input-field">

         <div class="search-container">
             <div class="search-header">
                 <h2 id="dynamicTitle">Find ETSI Documents</h2>
+                <p id="dynamicDesc">Enter a SET/SCP/TS document ID to locate the document in the ETSI DocBox server.</p>
             </div>
             <div class="search-mode">
                 <button id="single-mode-btn" class="active">Single Document</button>
+                <button id="batch-mode-btn">Batch Search</button>
+                <!--<button id="keyword-mode-btn">Keyword Search</button> -->
             </div>
             <div class="search-form">
                 <div class="input-group single-input">
                     <label for="doc-id">Document ID</label>
                     <div class="input-field">
+                        <input type="text" id="doc-id" placeholder="Enter SET/SCP/TS document ID (e.g. SETREQ(15)0015451r1, SCP(12)15151, 103 666-2)">
                         <button id="search-btn" class="btn">Search</button>
                     </div>
                 </div>
+                <div class="input-group batch-input">
                     <label for="batch-ids">Document IDs or Specification IDs (one per line)</label>
                     <textarea id="batch-ids" placeholder="Enter document IDs or specification IDs, one per line (e.g., S1-123456, C2-987654, 31.102)"></textarea>
                     <div class="hint">Enter one document ID per line</div>
                     <button id="batch-search-btn" class="btn" style="margin-top: 10px;">Search All</button>
                 </div>
+                <!--
                 <div class="input-group keyword-input">
                     <label for="keywords">Keywords</label>
                     <div class="input-field">