cxumol commited on
Commit
74164b2
·
1 Parent(s): 02fdb50

pre release milestone: generate pdf

Browse files
Files changed (8) hide show
  1. Signature.png +3 -0
  2. app.py +9 -4
  3. data_test.py +8 -0
  4. requirements.txt +1 -0
  5. taskNonAI.py +27 -1
  6. template_base.typ +62 -0
  7. template_letter.tmpl +15 -0
  8. test.py +8 -2
Signature.png ADDED

Git LFS Details

  • SHA256: cf478c8a80a695e91bb7a2a66126ed058ed2ba2f43a997356e1d13a58c095685
  • Pointer size: 129 Bytes
  • Size of remote file: 2.77 kB
app.py CHANGED
@@ -4,7 +4,7 @@ from config import STRONG_API_BASE, STRONG_API_KEY, STRONG_MODEL
4
  from util import is_valid_url
5
  from util import mylogger
6
  from util import stream_together
7
- from taskNonAI import extract_url, file_to_html
8
  from taskAI import TaskAI
9
  ## load data
10
  from data_test import mock_jd, mock_cv
@@ -14,7 +14,7 @@ import gradio as gr
14
  from pypandoc.pandoc_download import download_pandoc
15
  ## std
16
  import os
17
-
18
 
19
  logger = mylogger(__name__,'%(asctime)s:%(levelname)s:%(message)s')
20
  info = logger.info
@@ -89,6 +89,11 @@ def finalize_letter_txt(api_base, api_key, api_model, debug_CoT, jd, cv):
89
  for result in gen:
90
  yield result
91
 
 
 
 
 
 
92
  with gr.Blocks(
93
  title=DEMO_TITLE,
94
  theme=gr.themes.Base(primary_hue="blue", secondary_hue="sky", neutral_hue="slate"),
@@ -175,11 +180,11 @@ with gr.Blocks(
175
  ).then(fn=run_compose, inputs=[strong_base, strong_key, strong_model, min_jd, min_cv], outputs=[debug_CoT]
176
  ).then(fn=lambda:gr.Accordion("Expert Zone", open=False),inputs=None, outputs=[expert_zone]
177
  ).then(fn=finalize_letter_txt, inputs=[cheap_base, cheap_key, cheap_model, debug_CoT, jd_info, cv_text], outputs=[cover_letter_text, debug_jobapp]
178
- )
179
 
180
 
181
  if __name__ == "__main__":
182
  init()
183
- app.queue(max_size=10, default_concurrency_limit=1).launch(
184
  show_error=True, debug=True, share=IS_SHARE
185
  )
 
4
  from util import is_valid_url
5
  from util import mylogger
6
  from util import stream_together
7
+ from taskNonAI import extract_url, file_to_html, compile_pdf
8
  from taskAI import TaskAI
9
  ## load data
10
  from data_test import mock_jd, mock_cv
 
14
  from pypandoc.pandoc_download import download_pandoc
15
  ## std
16
  import os
17
+ import json
18
 
19
  logger = mylogger(__name__,'%(asctime)s:%(levelname)s:%(message)s')
20
  info = logger.info
 
89
  for result in gen:
90
  yield result
91
 
92
+ def finalize_letter_pdf(meta_data, cover_letter_text):
93
+ pdf_context = json.loads(meta_data)
94
+ pdf_context["letter_body"] = cover_letter_text
95
+ return compile_pdf(pdf_context,tmpl_path="template_letter.tmpl",output_path=f"/tmp/cover_letter_{pdf_context['applicant_full_name']}_to_{pdf_context['company_full_name']}.pdf")
96
+
97
  with gr.Blocks(
98
  title=DEMO_TITLE,
99
  theme=gr.themes.Base(primary_hue="blue", secondary_hue="sky", neutral_hue="slate"),
 
180
  ).then(fn=run_compose, inputs=[strong_base, strong_key, strong_model, min_jd, min_cv], outputs=[debug_CoT]
181
  ).then(fn=lambda:gr.Accordion("Expert Zone", open=False),inputs=None, outputs=[expert_zone]
182
  ).then(fn=finalize_letter_txt, inputs=[cheap_base, cheap_key, cheap_model, debug_CoT, jd_info, cv_text], outputs=[cover_letter_text, debug_jobapp]
183
+ ).then(fn=finalize_letter_pdf, inputs=[debug_jobapp, cover_letter_text], outputs=[cover_letter_pdf])
184
 
185
 
186
  if __name__ == "__main__":
187
  init()
188
+ app.queue(max_size=1, default_concurrency_limit=1).launch(
189
  show_error=True, debug=True, share=IS_SHARE
190
  )
data_test.py CHANGED
@@ -65,3 +65,11 @@ References
65
 
66
  Available upon request.
67
  """
 
 
 
 
 
 
 
 
 
65
 
66
  Available upon request.
67
  """
68
+ pdf_context = {
69
+ "company_full_name": "Mastercard",
70
+ "job_title": "Project Management Intern",
71
+ "applicant_full_name": "Dorothy Gale",
72
+ "applicant_contact_information": "123 Main St., Emerald City, KS 12345, (123) 456-7890, [email protected]",
73
+ "letter_body": "text,\n\ntest test"
74
+ }
75
+
requirements.txt CHANGED
@@ -1,6 +1,7 @@
1
  # UI
2
  gradio>=4.0,<=5.0
3
  # external tool
 
4
  pypandoc
5
  shot-scraper
6
  # LLM related
 
1
  # UI
2
  gradio>=4.0,<=5.0
3
  # external tool
4
+ typst
5
  pypandoc
6
  shot-scraper
7
  # LLM related
taskNonAI.py CHANGED
@@ -1,8 +1,14 @@
1
  import pypandoc
 
2
  ## stdlib
3
  import subprocess
4
  import json
 
5
  from typing import Optional
 
 
 
 
6
 
7
  def file_to_html(file_path: str) -> str:
8
  return pypandoc.convert_file(file_path, "html")
@@ -29,4 +35,24 @@ def extract_url(url: str) -> Optional[str]:
29
  except:
30
  raise Exception(
31
  f"Please try copy-paste as input. Failed to extract content from: {url}. Didn't find content from given URL!"
32
- )
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
  import pypandoc
2
+ import typst
3
  ## stdlib
4
  import subprocess
5
  import json
6
+ import os
7
  from typing import Optional
8
+ from string import Template
9
+
10
+ from datetime import datetime
11
+
12
 
13
  def file_to_html(file_path: str) -> str:
14
  return pypandoc.convert_file(file_path, "html")
 
35
  except:
36
  raise Exception(
37
  f"Please try copy-paste as input. Failed to extract content from: {url}. Didn't find content from given URL!"
38
+ )
39
+
40
+ def date():
41
+ current_date = datetime.now()
42
+ return current_date.strftime(
43
+ f"%B %d{'th' if 4 <= current_date.day <= 20 or 24 <= current_date.day <= 30 else ['st', 'nd', 'rd'][current_date.day % 10 - 1]} , %Y")
44
+
45
+ def typst_escape(s):
46
+ return s.replace('@','\@').replace('#','\#')
47
+
48
+ def compile_pdf(context: dict, tmpl_path: str, output_path="/tmp/cover_letter.pdf"):
49
+ with open(tmpl_path, "r", encoding='utf8') as f:
50
+ tmpl = Template(f.read())
51
+ context = {k: typst_escape(v) for k, v in context.items()}
52
+ context.update({'date_string': date()})
53
+ letter_typ = tmpl.safe_substitute(context)
54
+ with open('letter.typ', 'w', encoding='utf8') as f:
55
+ f.write(letter_typ)
56
+ typst.compile('letter.typ', output=output_path)
57
+ os.remove('letter.typ')
58
+ return output_path
template_base.typ ADDED
@@ -0,0 +1,62 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ // This function gets your whole document as its `body`
2
+ // and formats it as a simple letter.
3
+ #let letter(
4
+ // The letter's sender, which is display at the top of the page.
5
+ sender: none,
6
+
7
+ // The letter's recipient, which is displayed close to the top.
8
+ recipient: none,
9
+
10
+ // The date, displayed to the right.
11
+ date: none,
12
+
13
+ // The subject line.
14
+ subject: none,
15
+
16
+ // The name with which the letter closes.
17
+ name: none,
18
+
19
+ // The letter's content.
20
+ body
21
+ ) = {
22
+ // Configure page and text properties.
23
+ set page(paper: "us-letter", margin: (top: 2cm, bottom: 1.0cm))
24
+ set text(font: "PT Sans")
25
+
26
+ // Display sender at top of page. If there's no sender
27
+ // add some hidden text to keep the same spacing.
28
+ [== #name]
29
+ text(9pt, if sender == none {
30
+ hide("a")
31
+ } else {
32
+ sender
33
+ })
34
+
35
+ v(1.8cm)
36
+
37
+ // Display recipient.
38
+ recipient
39
+
40
+ v(0.5cm)
41
+
42
+ // Display date. If there's no date add some hidden
43
+ // text to keep the same spacing.
44
+ align(right, if date != none {
45
+ date
46
+ } else {
47
+ hide("a")
48
+ })
49
+
50
+ v(2cm)
51
+
52
+ // Add the subject line, if any.
53
+ if subject != none {
54
+ pad(right: 10%, strong(subject))
55
+ }
56
+
57
+ // Add body and name.
58
+ body
59
+ // v(1.25cm)
60
+ image("Signature.png", height: 7%, fit: "stretch")
61
+ name
62
+ }
template_letter.tmpl ADDED
@@ -0,0 +1,15 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ #import "template_base.typ": *
2
+ #show: letter.with(
3
+ sender: [
4
+ ${applicant_contact_information}
5
+ ],
6
+ recipient: [
7
+ Hiring Manager \
8
+ ${company_full_name} \
9
+ ],
10
+ date: [${date_string}],
11
+ subject: [Cover Letter for ${job_title}],
12
+ name: [${applicant_full_name}],
13
+ )
14
+
15
+ ${letter_body}
test.py CHANGED
@@ -1,5 +1,6 @@
1
  from taskAI import TaskAI
2
- from data_test import mock_jd, mock_cv
 
3
  from config_secret import api_test
4
 
5
  from llama_index.llms.openai_like import OpenAILike
@@ -27,6 +28,11 @@ def test_taskAI():
27
  for chunk in gen:
28
  print(chunk)
29
 
 
 
 
 
30
  if __name__ == "__main__":
31
- test_taskAI()
32
  # integration()
 
 
1
  from taskAI import TaskAI
2
+ from taskNonAI import compile_pdf
3
+ from data_test import mock_jd, mock_cv, pdf_context
4
  from config_secret import api_test
5
 
6
  from llama_index.llms.openai_like import OpenAILike
 
28
  for chunk in gen:
29
  print(chunk)
30
 
31
+ def test_typst_pdf():
32
+ compile_pdf(tmpl_path='template_letter.tmpl',context=pdf_context)
33
+ os
34
+
35
  if __name__ == "__main__":
36
+ # test_taskAI()
37
  # integration()
38
+ test_typst_pdf()