自动将 csv 文件插入 mysql table

Question

我正在尝试将大约 2000 个 csv 文件中的每一行插入 mysql table。使用以下代码，我只从一个文件中插入了一行。我怎样才能使代码自动化，以便它为每个文件插入所有行？插入只需完成一次。

import pymysql.cursors
connection = pymysql.connect(host='localhost',
                         user='s',
                         password='n9',
                         db='si',
                         charset='utf8mb4',
                         cursorclass=pymysql.cursors.DictCursor)

try:
with connection.cursor() as cursor:
    sql = "INSERT INTO `TrainsS` (`No.`, `Name`,`Zone`,`From`,`Delay`,`ETA`,`Location`,`To`) VALUES (%s,%s,%s,%s,%s,%s,%s, %s)"
    cursor.execute(sql, ('03', 'P Exp','SF','HWH', 'none','no arr today','n/a','ND'))


connection.commit()
finally:
connection.close()

Answer 1

检查这段代码如何？

至运行，您可以将所有 .csv 文件放在一个文件夹中，然后 os.walk(folder_location) 该文件夹以获取所有 .csv 文件的位置，然后我已将它们一一打开并在此处插入所需的数据库 (MySQL)。

import pandas as pd
import os
import subprocess
import warnings
warnings.simplefilter("ignore")

cwd = os.getcwd()

connection = pymysql.connect(host='localhost',
                     user='s',
                     password='n9',
                     db='si',
                     charset='utf8mb4',
                     cursorclass=pymysql.cursors.DictCursor)
files_csv = []
for subdir, dir, file in os.walk(cwd):
    files_csv += [ fi for fi in file if fi.endswith(".csv") ]

print(files_csv)

for i in range(len(files_csv)):
    with open(os.path.join(cwd, files_csv[i])) as f:
        lis=[line.split() for line in f]
        for i,x in enumerate(lis):
            #print("line{0} = {1}".format(i,x))
            #HERE x contains the row data and you can access it individualy using x[0], x[1], etc
            #USE YOUR MySQL INSERTION commands here and insert the x row here.
            with connection.cursor() as cursor:
                sql = "INSERT INTO `TrainsS` (`No.`, `Name`,`Zone`,`From`,`Delay`,`ETA`,`Location`,`To`) VALUES (%s,%s,%s,%s,%s,%s,%s, %s)"
                cursor.execute(sql, (#CONVERTED VALUES FROM x))


connection.commit()

更新- 获取 (#CONVERTED VALUES FROM X)

的值

values = ""
for i in range(len(columns)):
    values = values + x[i] + "," # Here x[i] gives a record data in ith row. Here i'm just appending the all values to be inserted in the sql table.
values = values[:-1] # Removing the last extra comma.
command = "INSERT INTO `TrainsS` (`No.`, `Name`,`Zone`,`From`,`Delay`,`ETA`,`Location`,`To`) VALUES (" + str(values) + ")"
cursor.execute(command)
#Then commit using connection.commit()

Answer 2

     import psycopg2
     import time
     import csv
     conn = psycopg2.connect(
             host = "localhost",
              database = "postgres",
              user = "postgres",
              password = "postgres"
             )
     cur = conn.cursor()
     start = time.time()
     with open('combined_category_data_100 copy.csv', 'r') as file:
          reader=csv.reader(file)
          ncol = len(next(reader))
          next(reader)
          for row in reader:
                  cur.execute(" insert into data values (%s = (no. of columns 
                   ))", row)

          conn.commit()
          print("data entered successfully")
          end = time.time()
          print(f" time taken is {end - start}")
          cur.close()

自动将 csv 文件插入 mysql table

Automated insertion of csv files into mysql table

mysql

csv

python-3.x

pymysql