cpg2py 1.0.2__py3-none-any.whl → 1.0.3__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
cpg2py/__init__.py CHANGED
@@ -1,11 +1,24 @@
1
+ import os
1
2
  from pathlib import Path
2
3
  from csv import DictReader
3
4
  from .cpg import _Graph
4
5
  from .abc import *
5
6
 
7
+ def __remove_null_bytes(file_path: Path) -> Path:
8
+ """Create a new clean file without NULL bytes and return its path."""
9
+ clean_path = file_path.with_suffix(".clean.csv") # Create a temp clean file
10
+ if clean_path.exists(): os.remove(clean_path)
11
+ with open(file_path, "rb") as f:
12
+ content = f.read().replace(b"\x00", b"") # Remove NULL bytes
13
+ with open(clean_path, "wb") as f:
14
+ f.write(content)
15
+ return clean_path
16
+
6
17
  def cpg_graph(node_csv: Path, edge_csv: Path) -> _Graph:
18
+ # Clean files before reading
19
+ tmp_node_csv = __remove_null_bytes(node_csv)
7
20
  storage = Storage()
8
- with open(node_csv, 'r') as n_file:
21
+ with open(tmp_node_csv, 'r') as n_file:
9
22
  reader = DictReader(n_file, delimiter='\t')
10
23
  for node_props in reader:
11
24
  nid = node_props.get("id:int", None)
@@ -14,7 +27,9 @@ def cpg_graph(node_csv: Path, edge_csv: Path) -> _Graph:
14
27
  print(f"Node {nid} already exists in the graph")
15
28
  if not storage.set_node_props(nid, node_props):
16
29
  print(f"Failed to set properties for node {nid}")
17
- with open(edge_csv, 'r') as f:
30
+ if tmp_node_csv.exists(): os.remove(tmp_node_csv)
31
+ tmp_edge_csv = __remove_null_bytes(edge_csv)
32
+ with open(tmp_edge_csv, 'r') as f:
18
33
  reader = DictReader(f, delimiter='\t')
19
34
  for edge_props in reader:
20
35
  f_nid = str(edge_props.get("start", None) )
@@ -28,6 +43,7 @@ def cpg_graph(node_csv: Path, edge_csv: Path) -> _Graph:
28
43
  print(f"Edge {f_nid} -> {t_nid} already exists in the graph")
29
44
  if not storage.set_edge_props(edge_id, edge_props):
30
45
  print(f"Failed to set properties for edge {edge_id}")
46
+ if tmp_edge_csv.exists(): os.remove(tmp_edge_csv)
31
47
  return _Graph(storage)
32
48
 
33
49
 
cpg2py/cpg/edge.py CHANGED
@@ -1,6 +1,5 @@
1
1
  from __future__ import annotations
2
2
  from typing import Optional, Tuple
3
- from enum import Enum
4
3
  from ..abc import AbcGraphQuerier, AbcEdgeQuerier
5
4
 
6
5
  class _Edge(AbcEdgeQuerier):
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.2
2
2
  Name: cpg2py
3
- Version: 1.0.2
3
+ Version: 1.0.3
4
4
  Summary: A graph-based data structure designed for querying CSV files in Joern format in Python
5
5
  Home-page: https://github.com/YichaoXu/cpg2py
6
6
  Author: Yichao Xu
@@ -1,15 +1,15 @@
1
- cpg2py/__init__.py,sha256=bjd1EjYmNa0N8DW4tSQg-YpzzkqgtBVR2FrgDZReY10,1557
1
+ cpg2py/__init__.py,sha256=InP4wevhbz1-Yp8cy-K3m1Bo8vJFaHfQLDEjeBrXVIg,2262
2
2
  cpg2py/abc/__init__.py,sha256=HgDXsJkGcPQvr6ac3hMrUU9TuQibMaP7-oXbXLs_iLI,207
3
3
  cpg2py/abc/edge.py,sha256=zLlRebDKT2qK5XOJq23_UUCESgGsvgalbXdx_uUcKks,1240
4
4
  cpg2py/abc/graph.py,sha256=DbeHN6qsNaqcqL9cUquJWC16BihDxy1MEhyuL-qVMBI,3902
5
5
  cpg2py/abc/node.py,sha256=E2EQv_KisEPuslFaglZZvSBm-VY5LYCFBOFY1yiPzDY,844
6
6
  cpg2py/abc/storage.py,sha256=BF82Vs_7FxGYSPiM_6JwQVzmaqMzGy2r-WSk8pQQclY,5976
7
7
  cpg2py/cpg/__init__.py,sha256=fO59Yd7OISyxdjdZDJ5zFM41r4cYKawOsvpqV4gWrGM,48
8
- cpg2py/cpg/edge.py,sha256=_ERU_lS4_5AxlOiuX73JvTZBSr9o8ae0q-kWwO82580,1029
8
+ cpg2py/cpg/edge.py,sha256=brG7cQl7tjihbUCBYyjNUnMLsKIif-XQc_TFdGz8ZYo,1007
9
9
  cpg2py/cpg/graph.py,sha256=n4EjAhhjzl0XRJBwlAmK5AcSrECiqhjA6dXt2Ucf7IM,3448
10
10
  cpg2py/cpg/node.py,sha256=-2xl8c-eSbe4Kv4xPAEf6POlCYOV4j0voxJAKDZj3Cc,2037
11
- cpg2py-1.0.2.dist-info/LICENSE,sha256=vTjbt7iL1hUilI8E87FoQerEDa9nbpeip26iA6bguHI,1066
12
- cpg2py-1.0.2.dist-info/METADATA,sha256=dCiQ4H2zcFC9AfFVOsSAkzFJDsKccGwcuyGYCnj9LRs,7077
13
- cpg2py-1.0.2.dist-info/WHEEL,sha256=In9FTNxeP60KnTkGw7wk6mJPYd_dQSjEZmXdBdMCI-8,91
14
- cpg2py-1.0.2.dist-info/top_level.txt,sha256=xDY8faKh5Rczvsqb5Jt9Sq-Y7EOImh7jh-m1oVTnH5k,7
15
- cpg2py-1.0.2.dist-info/RECORD,,
11
+ cpg2py-1.0.3.dist-info/LICENSE,sha256=vTjbt7iL1hUilI8E87FoQerEDa9nbpeip26iA6bguHI,1066
12
+ cpg2py-1.0.3.dist-info/METADATA,sha256=PTXtPmIDRjlyIZBOZJ_fXWrYMwK73WHlVoG6jHZFBMM,7077
13
+ cpg2py-1.0.3.dist-info/WHEEL,sha256=In9FTNxeP60KnTkGw7wk6mJPYd_dQSjEZmXdBdMCI-8,91
14
+ cpg2py-1.0.3.dist-info/top_level.txt,sha256=xDY8faKh5Rczvsqb5Jt9Sq-Y7EOImh7jh-m1oVTnH5k,7
15
+ cpg2py-1.0.3.dist-info/RECORD,,
File without changes