Skip to content
Snippets Groups Projects
Commit 38d5c8cb authored by Remi PLANEL
Browse files

Fix: Wrong pfam format

parent 3861d26c
No related branches found
No related tags found
No related merge requests found
Pipeline #120015 passed with stages in 9 minutes and 35 seconds
source diff could not be displayed: it is too large. Options to address this: view the blob.
...@@ -178,7 +178,7 @@ def systems( ...@@ -178,7 +178,7 @@ def systems(
with open(pfam, "r") as pf: with open(pfam, "r") as pf:
pfam_df = pd.read_csv(pf, index_col="AC", keep_default_na=False) pfam_df = pd.read_csv(pf, index_col="AC", keep_default_na=False)
systems = [] systems = []
if (output.exists()): if output.exists():
output.unlink() output.unlink()
with open(output, "a") as ty: with open(output, "a") as ty:
for file in dir.iterdir(): for file in dir.iterdir():
...@@ -188,8 +188,8 @@ def systems( ...@@ -188,8 +188,8 @@ def systems(
metadata, _ = frontmatter.parse(f.read()) metadata, _ = frontmatter.parse(f.read())
del metadata["layout"] del metadata["layout"]
sanitizedMetadata = {**metadata} sanitizedMetadata = {**metadata}
if "tableColumns" in metadata: if "tableColumns" in sanitizedMetadata:
table_data = metadata["tableColumns"] table_data = sanitizedMetadata["tableColumns"]
if "PFAM" in table_data: if "PFAM" in table_data:
pfams_list = [ pfams_list = [
pfam.strip() pfam.strip()
...@@ -204,7 +204,6 @@ def systems( ...@@ -204,7 +204,6 @@ def systems(
pfam_to_dict[pfam]["AC"] = pfam pfam_to_dict[pfam]["AC"] = pfam
flatten_value = pfam_to_dict[pfam] flatten_value = pfam_to_dict[pfam]
pfam_metadata.append(flatten_value) pfam_metadata.append(flatten_value)
except KeyError as err: except KeyError as err:
console.print(f"[bold red]{err}", style="red") console.print(f"[bold red]{err}", style="red")
console.print( console.print(
...@@ -215,14 +214,16 @@ def systems( ...@@ -215,14 +214,16 @@ def systems(
sanitizedMetadata["PFAM"] = pfam_metadata sanitizedMetadata["PFAM"] = pfam_metadata
if "article" in table_data: if "article" in table_data:
metadata["doi"] = table_data["article"]["doi"] sanitizedMetadata["doi"] = table_data["article"]["doi"]
if "abstract" in table_data["article"]: if "abstract" in table_data["article"]:
metadata["abstract"] = table_data["article"][ sanitizedMetadata["abstract"] = table_data["article"][
"abstract" "abstract"
] ]
del table_data["article"] del table_data["article"]
del metadata["tableColumns"] if "PFAM" in table_data:
sanitizedMetadata = {**metadata, **table_data} del table_data["PFAM"]
del sanitizedMetadata["tableColumns"]
sanitizedMetadata = {**sanitizedMetadata, **table_data}
systems.append(sanitizedMetadata) systems.append(sanitizedMetadata)
json_object = json.dumps(systems, indent=2) json_object = json.dumps(systems, indent=2)
......
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment