Spaces:

innoai
/

svg2png_api

Running

App Files Files Community

innoai committed 27 days ago

Commit

9be3968

verified ·

1 Parent(s): 815bc09

Update main.py

Browse files

Files changed (1) hide show

main.py +57 -11

main.py CHANGED Viewed

@@ -32,6 +32,12 @@ import urllib.parse
 from fastapi import FastAPI, File, Form, HTTPException, UploadFile
 from fastapi.responses import FileResponse, JSONResponse
 ###############################################################################
 # 1. Inkscape 检测
 ###############################################################################
@@ -73,21 +79,61 @@ def ensure_inkscape_available() -> tuple[bool, str]:
         return False, "未找到 Inkscape，请安装或手动加入 PATH"
 ###############################################################################
-# 2. URL 规范化（解决中文 / 空格 / () 等字符）
 ###############################################################################
 def normalize_url(url: str) -> str:
     """
-    将包含非 ASCII 字符的 URL 转为合法百分号编码格式
     """
-    parsed = urllib.parse.urlparse(url)
-    # 域名 IDNA（如有中文）
-    netloc = parsed.netloc.encode("idna").decode("ascii")
-    # 路径 / 查询 / 片段 百分号转义
-    path     = urllib.parse.quote(parsed.path, safe="/")
-    params   = urllib.parse.quote(parsed.params, safe=":&=")
-    query    = urllib.parse.quote_plus(parsed.query, safe="=&")
-    fragment = urllib.parse.quote(parsed.fragment, safe="")
-    return urllib.parse.urlunparse((parsed.scheme, netloc, path, params, query, fragment))
 ###############################################################################
 # 3. 下载并嵌入外链图片

 from fastapi import FastAPI, File, Form, HTTPException, UploadFile
 from fastapi.responses import FileResponse, JSONResponse
+# 导入字体安装函数
+from install_fonts import install_fonts_from_repository
+# 安装字体
+install_fonts_from_repository()
 ###############################################################################
 # 1. Inkscape 检测
 ###############################################################################
         return False, "未找到 Inkscape，请安装或手动加入 PATH"
 ###############################################################################
+# 2. URL 规范化：解决中文 / 空格 / () 等字符
 ###############################################################################
+#!/usr/bin/env python3
+# -*- coding: utf-8 -*-
+"""
+URL 规范化工具函数
+-----------------
+功能特点
+1. 支持中文域名及路径：自动在域名处使用 IDNA(Punycode)，在路径等位置做 % 编码
+2. **幂等**：已处理过的 URL 再次调用本函数不会出现二次编码
+3. 兼容常见 URL 组件：scheme、netloc、path、params、query、fragment
+"""
import re
import urllib.parse as _url

# Splits text around well-formed percent-escapes ("%" + two hex digits).
# The capture group makes re.split keep the escapes at the odd indices.
_PCT_ESCAPE_SPLIT = re.compile(r"(%[0-9A-Fa-f]{2})")

# RFC 3986 "unreserved" characters: an escape of one of these is equivalent
# to the literal character, so it can be decoded without changing meaning.
_UNRESERVED = frozenset(
    "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789-._~"
)


def _requote(text: str, safe: str, *, plus: bool = False) -> str:
    """Percent-encode *text* while leaving existing escapes intact.

    Well-formed escapes are kept (hex digits upper-cased), except escapes of
    unreserved characters, which are decoded to the literal character.
    Everything between escapes is quoted with ``quote`` (or ``quote_plus``
    when *plus* is true), so a stray ``%`` becomes ``%25``.
    """
    quoter = _url.quote_plus if plus else _url.quote
    out = []
    for index, piece in enumerate(_PCT_ESCAPE_SPLIT.split(text)):
        if index % 2:
            # Odd indices are the captured "%XX" escapes.
            char = chr(int(piece[1:], 16))
            out.append(char if char in _UNRESERVED else piece.upper())
        else:
            out.append(quoter(piece, safe=safe))
    return "".join(out)


def _encode_netloc(netloc: str) -> str:
    """Return *netloc* in ASCII form, applying IDNA to the host part only."""
    if netloc.isascii():
        # Already ASCII (possibly Punycode): nothing to convert.
        return netloc

    userinfo, at, hostport = netloc.rpartition("@")

    # Peel off a trailing ":port" so the IDNA codec never sees it.
    host, port = hostport, ""
    head, colon, tail = hostport.rpartition(":")
    if colon and (tail == "" or (tail.isascii() and tail.isdigit())):
        host, port = head, colon + tail

    if not host.isascii():
        host = host.encode("idna").decode("ascii")
    if userinfo:
        # Userinfo is percent-encoded, not Punycode-encoded.
        userinfo = _requote(userinfo, safe=":!$&'()*+,;=")
    return f"{userinfo}{at}{host}{port}"


def normalize_url(url: str) -> str:
    """Normalize a URL containing non-ASCII or unsafe characters.

    The host is converted with IDNA (Punycode); path, params, query and
    fragment are percent-encoded. Existing percent-escapes are preserved
    rather than decoded and re-encoded, so escaped delimiters such as
    ``%2F`` in a path or ``%26`` in a query value keep their meaning.
    The function is idempotent: normalizing an already-normalized URL
    returns it unchanged.

    Args:
        url: Original URL; may contain Chinese characters, spaces,
            parentheses and similar characters.

    Returns:
        The normalized URL.

    Raises:
        UnicodeError: If the host cannot be encoded with IDNA.
    """
    parsed = _url.urlparse(url)

    netloc = _encode_netloc(parsed.netloc)

    path = _requote(parsed.path, safe="/")
    params = _requote(parsed.params, safe=":&=")
    # In a query a literal "+" already stands for a space, so it must stay
    # as-is; raw spaces are turned into "+" by quote_plus.
    query = _requote(parsed.query, safe="=&+", plus=True)
    fragment = _requote(parsed.fragment, safe="")

    return _url.urlunparse((
        parsed.scheme,
        netloc,
        path,
        params,
        query,
        fragment,
    ))
 ###############################################################################
 # 3. 下载并嵌入外链图片