57 lines
2.1 KiB
Python
57 lines
2.1 KiB
Python
|
import pandas as pd
|
||
|
from neo4j import GraphDatabase
|
||
|
import argparse
|
||
|
import os
|
||
|
from dotenv import load_dotenv
|
||
|
|
||
|
# Load environment variables from .env file
|
||
|
load_dotenv()
|
||
|
|
||
|
def create_neo4j_session(uri, user, password):
|
||
|
return GraphDatabase.driver(uri, auth=(user, password))
|
||
|
|
||
|
def create_node(tx, node_type, properties):
|
||
|
# Create a Cypher query to create a node with given type and properties
|
||
|
properties_string = ', '.join([f"{key}: '{value}'" for key, value in properties.items()])
|
||
|
query = f"CREATE (n:{node_type} {{{properties_string}}})"
|
||
|
tx.run(query)
|
||
|
|
||
|
def main(csv_file_path):
|
||
|
# Read environment variables
|
||
|
NEO4J_URI = os.getenv("NEO4J_URI")
|
||
|
NEO4J_USER = os.getenv("NEO4J_USER")
|
||
|
NEO4J_PASSWORD = os.getenv("NEO4J_PASSWORD")
|
||
|
|
||
|
if not all([NEO4J_URI, NEO4J_USER, NEO4J_PASSWORD]):
|
||
|
raise ValueError("Neo4j URI, user, and password must be set in the environment variables.")
|
||
|
|
||
|
# Read the CSV file into a DataFrame
|
||
|
df = pd.read_csv(csv_file_path, delimiter='^', usecols=['type', 'id', 'title', 'description', 'url', 'date_enacted', 'date_repealed'])
|
||
|
|
||
|
# Connect to Neo4j
|
||
|
driver = create_neo4j_session(NEO4J_URI, NEO4J_USER, NEO4J_PASSWORD)
|
||
|
|
||
|
with driver.session() as session:
|
||
|
for _, row in df.iterrows():
|
||
|
node_type = row['type']
|
||
|
properties = {
|
||
|
'id': str(row['id']),
|
||
|
'title': row['title'],
|
||
|
'description': row['description'],
|
||
|
'url': row['url'],
|
||
|
'date_enacted': pd.to_datetime(row['date_enacted']).strftime('%Y-%m-%d') if pd.notnull(row['date_enacted']) else None,
|
||
|
'date_repealed': pd.to_datetime(row['date_repealed']).strftime('%Y-%m-%d') if pd.notnull(row['date_repealed']) else None
|
||
|
}
|
||
|
|
||
|
# Create the node in Neo4j
|
||
|
session.write_transaction(create_node, node_type, properties)
|
||
|
|
||
|
driver.close()
|
||
|
|
||
|
if __name__ == "__main__":
|
||
|
parser = argparse.ArgumentParser(description="Read a CSV file and create nodes in Neo4j.")
|
||
|
parser.add_argument("csv_file_path", type=str, help="Path to the CSV file")
|
||
|
|
||
|
args = parser.parse_args()
|
||
|
main(args.csv_file_path)
|