gui.py 15 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521
  1. import os
  2. import shutil
  3. import uuid
  4. import asyncio
  5. from asyncio import CancelledError
  6. from pathlib import Path
  7. from pdf2zh import __version__
  8. from pdf2zh.high_level import translate
  9. from pdf2zh.translator import (
  10. BaseTranslator,
  11. GoogleTranslator,
  12. BingTranslator,
  13. DeepLTranslator,
  14. DeepLXTranslator,
  15. OllamaTranslator,
  16. AzureOpenAITranslator,
  17. OpenAITranslator,
  18. ZhipuTranslator,
  19. SiliconTranslator,
  20. GeminiTranslator,
  21. AzureTranslator,
  22. TencentTranslator,
  23. DifyTranslator,
  24. AnythingLLMTranslator,
  25. )
  26. import gradio as gr
  27. from gradio_pdf import PDF
  28. import tqdm
  29. import requests
  30. import cgi
# Maps the service name offered in the UI "Service" dropdown to the translator
# class that implements it. The values are the classes themselves (never
# instantiated here); translate_file() reads their ``envs`` and ``name``
# attributes.
service_map: dict[str, type[BaseTranslator]] = {
    "Google": GoogleTranslator,
    "Bing": BingTranslator,
    "DeepL": DeepLTranslator,
    "DeepLX": DeepLXTranslator,
    "Ollama": OllamaTranslator,
    "AzureOpenAI": AzureOpenAITranslator,
    "OpenAI": OpenAITranslator,
    "Zhipu": ZhipuTranslator,
    "Silicon": SiliconTranslator,
    "Gemini": GeminiTranslator,
    "Azure": AzureTranslator,
    "Tencent": TencentTranslator,
    "Dify": DifyTranslator,
    "AnythingLLM": AnythingLLMTranslator,
}
# Maps the language name offered in the "Translate from" / "Translate to"
# dropdowns to the language code handed to translate() as lang_in / lang_out.
lang_map = {
    "Chinese": "zh",
    "English": "en",
    "French": "fr",
    "German": "de",
    "Japanese": "ja",
    "Korean": "ko",
    "Russian": "ru",
    "Spanish": "es",
    "Italian": "it",
}
  58. page_map = {
  59. "All": None,
  60. "First": [0],
  61. "First 5 pages": list(range(0, 5)),
  62. }
  63. flag_demo = False
  64. if os.getenv("PDF2ZH_DEMO"):
  65. flag_demo = True
  66. service_map = {
  67. "Google": GoogleTranslator,
  68. }
  69. page_map = {
  70. "First": [0],
  71. "First 20 pages": list(range(0, 20)),
  72. }
  73. client_key = os.getenv("PDF2ZH_CLIENT_KEY")
  74. server_key = os.getenv("PDF2ZH_SERVER_KEY")
  75. def verify_recaptcha(response):
  76. recaptcha_url = "https://www.google.com/recaptcha/api/siteverify"
  77. print("reCAPTCHA", server_key, response)
  78. data = {"secret": server_key, "response": response}
  79. result = requests.post(recaptcha_url, data=data).json()
  80. print("reCAPTCHA", result.get("success"))
  81. return result.get("success")
  82. def download_with_limit(url, save_path, size_limit):
  83. chunk_size = 1024
  84. total_size = 0
  85. with requests.get(url, stream=True, timeout=10) as response:
  86. response.raise_for_status()
  87. content = response.headers.get("Content-Disposition")
  88. try: # filename from header
  89. _, params = cgi.parse_header(content)
  90. filename = params["filename"]
  91. except Exception: # filename from url
  92. filename = os.path.basename(url)
  93. with open(save_path / filename, "wb") as file:
  94. for chunk in response.iter_content(chunk_size=chunk_size):
  95. total_size += len(chunk)
  96. if size_limit and total_size > size_limit:
  97. raise gr.Error("Exceeds file size limit")
  98. file.write(chunk)
  99. return save_path / filename
  100. def stop_translate_file(state):
  101. session_id = state["session_id"]
  102. if session_id is None:
  103. return
  104. if session_id in cancellation_event_map:
  105. cancellation_event_map[session_id].set()
  106. def translate_file(
  107. file_type,
  108. file_input,
  109. link_input,
  110. service,
  111. lang_from,
  112. lang_to,
  113. page_range,
  114. recaptcha_response,
  115. state,
  116. progress=gr.Progress(),
  117. *envs,
  118. ):
  119. session_id = uuid.uuid4()
  120. state["session_id"] = session_id
  121. cancellation_event_map[session_id] = asyncio.Event()
  122. """Translate PDF content using selected service."""
  123. if flag_demo and not verify_recaptcha(recaptcha_response):
  124. raise gr.Error("reCAPTCHA fail")
  125. progress(0, desc="Starting translation...")
  126. output = Path("pdf2zh_files")
  127. output.mkdir(parents=True, exist_ok=True)
  128. if file_type == "File":
  129. if not file_input:
  130. raise gr.Error("No input")
  131. file_path = shutil.copy(file_input, output)
  132. else:
  133. if not link_input:
  134. raise gr.Error("No input")
  135. file_path = download_with_limit(
  136. link_input,
  137. output,
  138. 5 * 1024 * 1024 if flag_demo else None,
  139. )
  140. filename = os.path.splitext(os.path.basename(file_path))[0]
  141. file_raw = output / f"{filename}.pdf"
  142. file_mono = output / f"{filename}-mono.pdf"
  143. file_dual = output / f"{filename}-dual.pdf"
  144. translator = service_map[service]
  145. selected_page = page_map[page_range]
  146. lang_from = lang_map[lang_from]
  147. lang_to = lang_map[lang_to]
  148. for i, env in enumerate(translator.envs.items()):
  149. os.environ[env[0]] = envs[i]
  150. print(f"Files before translation: {os.listdir(output)}")
  151. def progress_bar(t: tqdm.tqdm):
  152. progress(t.n / t.total, desc="Translating...")
  153. param = {
  154. "files": [str(file_raw)],
  155. "pages": selected_page,
  156. "lang_in": lang_from,
  157. "lang_out": lang_to,
  158. "service": f"{translator.name}",
  159. "output": output,
  160. "thread": 4,
  161. "callback": progress_bar,
  162. "cancellation_event": cancellation_event_map[session_id],
  163. }
  164. print(param)
  165. try:
  166. translate(**param)
  167. except CancelledError:
  168. del cancellation_event_map[session_id]
  169. raise gr.Error("Translation cancelled")
  170. print(f"Files after translation: {os.listdir(output)}")
  171. if not file_mono.exists() or not file_dual.exists():
  172. raise gr.Error("No output")
  173. progress(1.0, desc="Translation complete!")
  174. return (
  175. str(file_mono),
  176. str(file_mono),
  177. str(file_dual),
  178. gr.update(visible=True),
  179. gr.update(visible=True),
  180. gr.update(visible=True),
  181. )
# Global setup

# Blue palette (shades c50..c950) used as the primary hue of the Gradio theme.
custom_blue = gr.themes.Color(
    c50="#E8F3FF",
    c100="#BEDAFF",
    c200="#94BFFF",
    c300="#6AA1FF",
    c400="#4080FF",
    c500="#165DFF",  # Primary color
    c600="#0E42D2",
    c700="#0A2BA6",
    c800="#061D79",
    c900="#03114D",
    c950="#020B33",
)

# Cancellation events keyed by session id: translate_file() registers an
# asyncio.Event under a fresh UUID and stop_translate_file() sets it.
cancellation_event_map: dict[uuid.UUID, asyncio.Event] = {}
# Build the Gradio UI. Components are created inside nested Row/Column
# contexts, so the order and nesting of the statements below is significant.
# NOTE(review): the nesting here was reconstructed from a listing whose
# indentation had been stripped — confirm the Row/Column membership of each
# component against the intended layout.
with gr.Blocks(
    title="PDFMathTranslate - PDF Translation with preserved formats",
    theme=gr.themes.Default(
        primary_hue=custom_blue, spacing_size="md", radius_size="lg"
    ),
    css="""
.secondary-text {color: #999 !important;}
footer {visibility: hidden}
.env-warning {color: #dd5500 !important;}
.env-success {color: #559900 !important;}
/* Add dashed border to input-file class */
.input-file {
border: 1.2px dashed #165DFF !important;
border-radius: 6px !important;
}
.progress-bar-wrap {
border-radius: 8px !important;
}
.progress-bar {
border-radius: 8px !important;
}
""",
    # In demo mode the page loads the reCAPTCHA script and defines onVerify(),
    # which copies the token into the textarea of the element with id "verify"
    # and fires an input event on it.
    head=(
        """
<script src="https://www.google.com/recaptcha/api.js?render=explicit" async defer></script>
<script type="text/javascript">
var onVerify = function(token) {
el=document.getElementById('verify').getElementsByTagName('textarea')[0];
el.value=token;
el.dispatchEvent(new Event('input'));
};
</script>
"""
        if flag_demo
        else ""
    ),
) as demo:
    gr.Markdown(
        "# [PDFMathTranslate @ GitHub](https://github.com/Byaidu/PDFMathTranslate)"
    )

    with gr.Row():
        # Left column: input selection, options, downloads and action buttons.
        with gr.Column(scale=1):
            gr.Markdown("## File | < 5 MB" if flag_demo else "## File")
            file_type = gr.Radio(
                choices=["File", "Link"],
                label="Type",
                value="File",
            )
            file_input = gr.File(
                label="File",
                file_count="single",
                file_types=[".pdf"],
                type="filepath",
                elem_classes=["input-file"],
            )
            # Hidden until the "Link" type is selected (see on_select_filetype).
            link_input = gr.Textbox(
                label="Link",
                visible=False,
                interactive=True,
            )
            gr.Markdown("## Option")
            service = gr.Dropdown(
                label="Service",
                choices=service_map.keys(),
                value="Google",
            )
            # Three initially hidden textboxes that on_select_service() relabels
            # and shows, one per setting of the selected translator.
            envs = []
            for i in range(3):
                envs.append(
                    gr.Textbox(
                        visible=False,
                        interactive=True,
                    )
                )
            with gr.Row():
                lang_from = gr.Dropdown(
                    label="Translate from",
                    choices=lang_map.keys(),
                    value="English",
                )
                lang_to = gr.Dropdown(
                    label="Translate to",
                    choices=lang_map.keys(),
                    value="Chinese",
                )
            page_range = gr.Radio(
                choices=page_map.keys(),
                label="Pages",
                value=list(page_map.keys())[0],
            )

            def on_select_service(service, evt: gr.EventData):
                """Return updates for the three env textboxes for *service*.

                All three boxes are first hidden and cleared; then one box per
                entry of the translator's ``envs`` mapping is shown, labelled
                with the variable name and pre-filled with the current
                environment value or, failing that, the mapping's default.
                """
                # NOTE(review): `evt` is not used in this function.
                translator = service_map[service]
                _envs = []
                for i in range(3):
                    _envs.append(gr.update(visible=False, value=""))
                # NOTE(review): a translator with more than three envs would
                # raise IndexError on `_envs[i]` below.
                for i, env in enumerate(translator.envs.items()):
                    _envs[i] = gr.update(
                        visible=True, label=env[0], value=os.getenv(env[0], env[1])
                    )
                return _envs

            def on_select_filetype(file_type):
                """Show the file picker for "File" and the URL box for "Link"."""
                return (
                    gr.update(visible=file_type == "File"),
                    gr.update(visible=file_type == "Link"),
                )

            # Result widgets stay hidden until translate_file() returns
            # visibility updates for them.
            output_title = gr.Markdown("## Translated", visible=False)
            output_file_mono = gr.File(
                label="Download Translation (Mono)", visible=False
            )
            output_file_dual = gr.File(
                label="Download Translation (Dual)", visible=False
            )
            # Hidden textbox carrying the reCAPTCHA token; the page-level
            # onVerify() script finds it through elem_id "verify".
            recaptcha_response = gr.Textbox(
                label="reCAPTCHA Response", elem_id="verify", visible=False
            )
            # Placeholder element that grecaptcha.render() targets by id.
            recaptcha_box = gr.HTML('<div id="recaptcha-box"></div>')
            translate_btn = gr.Button("Translate", variant="primary")
            cancellation_btn = gr.Button("Cancel", variant="secondary")
            # NOTE(review): the markup uses <summary> without an enclosing
            # <details> element — confirm this renders as intended.
            tech_details_tog = gr.Markdown(
                f"""
<summary>Technical details</summary>
- GitHub: <a href="https://github.com/Byaidu/PDFMathTranslate">Byaidu/PDFMathTranslate</a><br>
- GUI by: <a href="https://github.com/reycn">Rongxin</a><br>
- Version: {__version__}
""",
                elem_classes=["secondary-text"],
            )
            service.select(
                on_select_service,
                service,
                envs,
            )
            # In demo mode the attached JS also tries to render the reCAPTCHA
            # widget into "recaptcha-box"; any error from render() is swallowed
            # by the empty catch.
            file_type.select(
                on_select_filetype,
                file_type,
                [file_input, link_input],
                js=(
                    f"""
(a,b)=>{{
try{{
grecaptcha.render('recaptcha-box',{{
'sitekey':'{client_key}',
'callback':'onVerify'
}});
}}catch(error){{}}
return [a];
}}
"""
                    if flag_demo
                    else ""
                ),
            )

        # Right column: document preview.
        with gr.Column(scale=2):
            gr.Markdown("## Preview")
            preview = PDF(label="Document Preview", visible=True)

    # Event handlers
    # Uploading a file shows it in the preview; in demo mode the same JS as
    # above attempts to render the reCAPTCHA widget.
    file_input.upload(
        lambda x: x,
        inputs=file_input,
        outputs=preview,
        js=(
            f"""
(a,b)=>{{
try{{
grecaptcha.render('recaptcha-box',{{
'sitekey':'{client_key}',
'callback':'onVerify'
}});
}}catch(error){{}}
return [a];
}}
"""
            if flag_demo
            else ""
        ),
    )

    # Per-session state; translate_file() stores the running session id here
    # and stop_translate_file() reads it.
    state = gr.State({"session_id": None})

    # translate_file() returns six values, matched positionally to `outputs`:
    # mono path, preview path, dual path, then three visibility updates.
    # output_file_mono and output_file_dual therefore each appear twice.
    translate_btn.click(
        translate_file,
        inputs=[
            file_type,
            file_input,
            link_input,
            service,
            lang_from,
            lang_to,
            page_range,
            recaptcha_response,
            state,
            *envs,
        ],
        outputs=[
            output_file_mono,
            preview,
            output_file_dual,
            output_file_mono,
            output_file_dual,
            output_title,
        ],
    ).then(lambda: None, js="()=>{grecaptcha.reset()}" if flag_demo else "")

    cancellation_btn.click(
        stop_translate_file,
        inputs=[state],
    )
  401. def readuserandpasswd(file_path):
  402. tuple_list = []
  403. content = ""
  404. if len(file_path) == 2:
  405. try:
  406. with open(file_path[1], "r", encoding="utf-8") as file:
  407. content = file.read()
  408. except FileNotFoundError:
  409. print(f"Error: File '{file_path[1]}' not found.")
  410. try:
  411. with open(file_path[0], "r", encoding="utf-8") as file:
  412. tuple_list = [
  413. tuple(line.strip().split(",")) for line in file if line.strip()
  414. ]
  415. except FileNotFoundError:
  416. print(f"Error: File '{file_path[0]}' not found.")
  417. return tuple_list, content
  418. def setup_gui(share=False, authfile=["", ""]):
  419. userlist, html = readuserandpasswd(authfile)
  420. if flag_demo:
  421. demo.launch(server_name="0.0.0.0", max_file_size="5mb", inbrowser=True)
  422. else:
  423. if len(userlist) == 0:
  424. try:
  425. demo.launch(
  426. server_name="0.0.0.0", debug=True, inbrowser=True, share=share
  427. )
  428. except Exception:
  429. print(
  430. "Error launching GUI using 0.0.0.0.\nThis may be caused by global mode of proxy software."
  431. )
  432. try:
  433. demo.launch(
  434. server_name="127.0.0.1", debug=True, inbrowser=True, share=share
  435. )
  436. except Exception:
  437. print(
  438. "Error launching GUI using 127.0.0.1.\nThis may be caused by global mode of proxy software."
  439. )
  440. demo.launch(debug=True, inbrowser=True, share=True)
  441. else:
  442. try:
  443. demo.launch(
  444. server_name="0.0.0.0",
  445. debug=True,
  446. inbrowser=True,
  447. share=share,
  448. auth=userlist,
  449. auth_message=html,
  450. )
  451. except Exception:
  452. print(
  453. "Error launching GUI using 0.0.0.0.\nThis may be caused by global mode of proxy software."
  454. )
  455. try:
  456. demo.launch(
  457. server_name="127.0.0.1",
  458. debug=True,
  459. inbrowser=True,
  460. share=share,
  461. auth=userlist,
  462. auth_message=html,
  463. )
  464. except Exception:
  465. print(
  466. "Error launching GUI using 127.0.0.1.\nThis may be caused by global mode of proxy software."
  467. )
  468. demo.launch(
  469. debug=True,
  470. inbrowser=True,
  471. share=True,
  472. auth=userlist,
  473. auth_message=html,
  474. )
# For auto-reloading while developing
# Running this module directly launches the GUI with the default arguments.
if __name__ == "__main__":
    setup_gui()