Shami96 committed on
Commit
31d231c
·
verified ·
1 Parent(s): 50613d0

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +14 -7
app.py CHANGED
@@ -5,15 +5,22 @@ from utils import extract_text_from_pdf, parse_pdf_to_dict
5
 
6
  from docx.shared import RGBColor
7
 
8
- def replace_red_text_with_data(doc_path, data_dict):
9
- doc = Document(doc_path)
 
 
 
10
 
11
  for para in doc.paragraphs:
12
- for run in para.runs:
13
- if run.font.color and run.font.color.rgb and run.font.color.rgb == RGBColor(255, 0, 0):
14
- text = run.text.strip()
15
- if text in data_dict:
16
- run.text = data_dict[text]
 
 
 
 
17
 
18
  return doc
19
 
 
5
 
6
  from docx.shared import RGBColor
7
 
8
+ from docx import Document
9
+ from docx.shared import RGBColor
10
+
11
+ def replace_red_text_with_data(word_path, data_dict):
12
+ doc = Document(word_path)
13
 
14
  for para in doc.paragraphs:
15
+ full_text = para.text
16
+ for i, run in enumerate(para.runs):
17
+ if run.font.color and run.font.color.rgb == RGBColor(255, 0, 0):
18
+ # Search for the key (label) before this red text
19
+ preceding_text = ''.join(r.text for r in para.runs[:i]).lower()
20
+ for key in data_dict:
21
+ if key.lower() in preceding_text:
22
+ run.text = data_dict[key]
23
+ break
24
 
25
  return doc
26