We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 9285f5f; commit 1acd2ed (Copy full SHA for 1acd2ed)
adi_function_app/pre_embedding_cleaner.py
@@ -71,11 +71,10 @@ def clean_text(src_text: str) -> str:
71
try:
72
# Define specific patterns for each tag
73
tag_patterns = {
74
- "figurecontent": r"<!-- FigureContent=(.*?)-->",
+ "figurecontent": r"<!--.*?FigureContent=(.*?)-->",
75
"figure": r"<figure>(.*?)</figure>",
76
"figures": r"\(figures/\d+\)(.*?)\(figures/\d+\)",
77
- "figcaption": r"<figcaption>(.*?)</figcaption>",
78
- "figureidandcontent": r'<!--\s*FigureId="[^"]*"\s*FigureContent="[^"]*"\s*-->'
+ "figcaption": r"<figcaption>(.*?)</figcaption>"
79
}
80
cleaned_text = remove_markdown_tags(src_text, tag_patterns)
81
0 commit comments