-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathremove_hyperlinks.py
46 lines (34 loc) · 1.71 KB
/
remove_hyperlinks.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
import re
import os
# Change the working directory to 'docs/'
os.chdir("docs/")
# Function to remove relative links from the provided file paths
def remove_relative_links(file_paths):
# Regex pattern to match markdown links
link_pattern = re.compile(r'\[([^\]]+)\]\(([^)]+)\)')
for file_path in file_paths:
with open(file_path, 'r', encoding='utf-8') as file:
content = file.read()
def replace_link(match):
text = match.group(1)
url = match.group(2)
# Check if the URL is a relative link (does not contain http or https)
if not url.startswith(('http://', 'https://')):
return text # Return only the text, removing the link
return match.group(0) # Return the whole match unchanged
# Process content to remove relative links
new_content = re.sub(link_pattern, replace_link, content)
with open(file_path, 'w', encoding='utf-8') as file:
file.write(new_content)
# List all .md files in the current directory
all_md_files = [file for file in os.listdir() if file.endswith('.md')]
# Define the stoplist of files to ignore
stoplist =["changelog.md","impressum.md","index.md", "introduction.md","mermaid.md"]
# Filter out the files in the stoplist
file_paths_to_process = [file for file in all_md_files if file not in stoplist]
# Process the remaining files
remove_relative_links(file_paths_to_process)
# Example usage
#file_paths = ["in-situ_observation.md","information.md","introduction.md","location.md","measurand.md","measurement.md","observation.md","uncertainty.md"]
#stoplist =["changelog.md","impressum.md","index.md", "introduction.md","mermaid.md"]
# file_paths = ["uncertainty.md"]