1
+ import os
2
+ import pandas as pd
3
+ import warnings
4
+ import re
5
+ import string
6
+ import pathlib
7
+ warnings .filterwarnings ("ignore" )
8
+ import sys
9
+
10
+ GLOSSARY_HEADER = """# Existing Terms and Definitions
11
+
12
+ """
13
+ BASE_LINK_WIKI = "https://github.com/OpenEnergyPlatform/ontology/wiki/"
14
+ BASE_IRI = "http://openenergy-platform.org/ontology/oeo/"
15
+
16
+ if __name__ == '__main__' :
17
+ arguments = sys .argv [1 :]
18
+ if len (arguments ) > 0 :
19
+ target_path = arguments [0 ]
20
+ else :
21
+ target_path = 'src/scripts/etd'
22
+ cwd = os .getcwd ()
23
+ df = pd .read_excel (pathlib .Path (target_path ).joinpath ("etd.xlsx" ).as_posix ())
24
+
25
+ df = df .replace ('\n ' , '<br>' , regex = True )
26
+ df = df .sort_values ("LABEL" , key = lambda col : col .str .strip ().str .lower ())
27
+ # Create one table per letter:
28
+
29
+ pathlib .Path (cwd + "/src/scripts/etd/glossary/" ).mkdir (parents = True , exist_ok = True )
30
+
31
+ # header = GLOSSARY_HEADER + " ".join([f"[{letter}]({BASE_LINK_WIKI}{letter})" for letter in string.ascii_uppercase]) + "\n"
32
+
33
+ # with open(cwd + "/src/scripts/etd/glossary/glossary.md", "w") as fil:
34
+ # fil.write(header)
35
+ output = GLOSSARY_HEADER + "\n "
36
+ for letter in string .ascii_lowercase :
37
+ current_df = df [df ["LABEL" ].str .lower ().str .startswith (letter )]
38
+ if current_df .empty :
39
+ continue
40
+ buffer = current_df .to_markdown (index = False )
41
+ buffer = re .sub (r"(?s)(http:\/\/openenergy-platform.org\/ontology\/oeo\/?)\w+-\w+\/(\w+)(?=_)_(\d+?)(?=\s)" , r"\2:\3" , buffer )
42
+ # There is a weird typo in surface azimuth angle ?
43
+ buffer = re .sub (r"(?s)(http:\/\/opennergy-plattform.org\/ontology\/oeo\/?)\/(\w+)(?=_)_(\d+?)(?=\s)" , r"\2:\3" , buffer )
44
+ # Remove the thing above when the typo is fixed
45
+ buffer = re .sub (r"(?s)(\w+?)(?=:):(\d+?)(?=\s)" , r"[\1:\2]({}" .format (BASE_IRI )+ r"\1_\2)" , buffer )
46
+ title = f"## { letter .capitalize ()} \n \n "
47
+ table = title + buffer + "\n \n "
48
+ #df.to_markdown(buf=cwd + "/src/scripts/etd/ETD.md", index=False)
49
+ output += table
50
+ with open (pathlib .Path (target_path ).joinpath ("glossary/glossary.md" ).as_posix (), "w" ) as fil :
51
+ fil .write (output )
52
+
53
+ # create csv output
54
+ df_csv = df .copy ()
55
+ df_csv ["ID" ] = df_csv ["ID" ].str .replace ("http://openenergy-platform.org/ontology/oeo/oeo-physical/" , "" )
56
+ df_csv ["ID" ] = df_csv ["ID" ].str .replace ("http://openenergy-platform.org/ontology/oeo/oeo-model/" , "" )
57
+ df_csv ["ID" ] = df_csv ["ID" ].str .replace (":" , "_" )
58
+ df_csv .to_csv (pathlib .Path (target_path ).joinpath ("glossary/glossary.csv" ).as_posix (), index = False )
0 commit comments