# projectEli/Database/items/createTables.py
# (79 lines, 2.7 KiB, Python)

import sqlite3
import os
import csv
def get_data_type(value):
    """Infer the SQLite column type that best fits a raw CSV value.

    Args:
        value: A cell value, normally a string produced by ``csv.reader``.

    Returns:
        ``"INTEGER"`` if ``int(value)`` succeeds, ``"REAL"`` if only
        ``float(value)`` succeeds, and ``"TEXT"`` otherwise (including for
        empty strings and non-convertible objects such as ``None``).
    """
    # Try the narrowest type first; the first conversion that succeeds wins.
    for convert, sql_type in ((int, "INTEGER"), (float, "REAL")):
        try:
            convert(value)
        except (ValueError, TypeError):
            # ValueError: not a number in this format.
            # TypeError: not a string/number at all (e.g. None).
            continue
        return sql_type
    return "TEXT"
# (revision timestamp: 2023-09-06 02:59:56 +00:00)
# Rebuild "database.db" from the CSV files in the data directory: every
# existing table is dropped, then one table per CSV file is created (named
# after the file, columns taken from the header row, column types inferred
# from the first data row) and filled with the file's rows.


def _quote_identifier(name):
    """Return *name* as a double-quoted SQL identifier, doubling embedded quotes."""
    return '"' + name.replace('"', '""') + '"'


# Connect to the SQLite database and delete existing tables
conn = sqlite3.connect("database.db")
try:
    cursor = conn.cursor()

    # Get a list of CSV files in the "data" directory
    data_dir = "data"  # Change this to your data directory path
    csv_files = [f for f in os.listdir(data_dir) if f.endswith(".csv")]

    # Drop all existing tables except for sqlite_sequence
    cursor.execute("PRAGMA foreign_keys = OFF;")
    cursor.execute(
        "SELECT name FROM sqlite_master WHERE type='table' AND name NOT LIKE 'sqlite_sequence';"
    )
    for (existing_table,) in cursor.fetchall():
        # Quote the name so tables with spaces/keywords in their names drop cleanly.
        cursor.execute(f"DROP TABLE IF EXISTS {_quote_identifier(existing_table)};")

    # Commit the changes to delete existing tables
    conn.commit()

    # Iterate through CSV files and create new tables
    for csv_file in csv_files:
        table_name = os.path.splitext(csv_file)[0]
        quoted_table = _quote_identifier(table_name)

        # Open the file once: header, type inference and inserts all stream
        # from the same reader.
        with open(os.path.join(data_dir, csv_file), newline="") as csvfile:
            csv_reader = csv.reader(csvfile)

            # The first row of the CSV file holds the column names.
            header = next(csv_reader, None)
            if not header:
                # Empty file (or blank first line): there is nothing to build
                # a table from.
                continue

            # csv.reader yields [] for blank lines; they carry no data.
            data_rows = (row for row in csv_reader if row)

            # The first data row determines the column types. A header-only
            # file has no such row, so every column falls back to TEXT.
            first_row = next(data_rows, None)
            data_types = (
                [get_data_type(value) for value in first_row] if first_row else []
            )

            # Generate the CREATE TABLE statement dynamically based on the
            # column names and data types.
            column_definitions = []
            for index, column_name in enumerate(header):
                # A short first row must not silently drop trailing columns.
                data_type = data_types[index] if index < len(data_types) else "TEXT"
                definition = f"    {_quote_identifier(column_name)} {data_type}"
                # Add a primary key if needed (replace 'unique_id' with your
                # unique identifier column name). The constraint has to come
                # after the type in a column definition.
                if column_name == "unique_id":
                    definition += " PRIMARY KEY"
                column_definitions.append(definition)

            create_table_sql = (
                f"CREATE TABLE IF NOT EXISTS {quoted_table} (\n"
                + ",\n".join(column_definitions)
                + "\n);"
            )

            # Execute the CREATE TABLE statement
            cursor.execute(create_table_sql)

            # Insert the data rows; values are always bound as parameters.
            if first_row is not None:
                placeholders = ",".join(["?"] * len(header))
                insert_sql = f"INSERT INTO {quoted_table} VALUES ({placeholders});"
                cursor.execute(insert_sql, first_row)
                cursor.executemany(insert_sql, data_rows)

    # Commit the changes
    conn.commit()
finally:
    # Close the connection even if an import step failed; uncommitted work
    # is discarded by SQLite when the connection closes.
    conn.close()