python随机抽取行信息

169 阅读1分钟
# coding = utf-8
# 导包
from time import *
import numpy as np
import pandas as pd
import csv
import random

# File locations, sample size and column names used by the script.
INPUT_CSV = "0830-delivered.csv"
OUTPUT_CSV = "cq.csv"
SAMPLE_SIZE = 100
COLUMNS = [
    "rawRowAddr", "jd", "wd", "xxdmc", "table_name",
    "created_time", "wzxxdms", "xzqhbm", "seq", "带标注语句",
]


def load_rows(path=INPUT_CSV):
    """Read the CSV file at *path* and return its rows as a 2-D ndarray.

    pandas treats the first line of the file as a header; those names are
    then replaced with ``COLUMNS``.

    Raises:
        ValueError: if the file does not have exactly ``len(COLUMNS)``
            columns (raised by pandas when assigning the column names).
    """
    df = pd.read_csv(path, encoding="utf-8")
    df.columns = COLUMNS
    return np.array(df[COLUMNS])


def sample_rows(data, k=SAMPLE_SIZE):
    """Return up to *k* distinct rows of *data*, picked at random.

    Each returned row is a plain ``list``. When *data* has fewer than *k*
    rows, every row is returned once (in random order).
    """
    total = len(data)
    count = max(0, min(k, total))
    # random.sample draws without replacement, so exactly `count` distinct
    # row indices come back -- no retry loop or "already seen" list needed.
    picked = random.sample(range(total), count)
    return [list(data[index]) for index in picked]


def append_rows(rows, path=OUTPUT_CSV):
    """Append *rows* to the CSV file at *path* using the excel dialect."""
    # newline="" keeps the csv module's own line terminator from being
    # translated a second time, which would leave blank lines in the output.
    with open(path, "a", newline="") as out_csv:
        csv.writer(out_csv, dialect="excel").writerows(rows)


def main():
    """Sample rows from INPUT_CSV into OUTPUT_CSV and print elapsed seconds."""
    start = time()
    append_rows(sample_rows(load_rows()))
    # Elapsed time is end minus start, so the printed value is non-negative.
    runtime = time() - start
    print(runtime)


if __name__ == "__main__":
    main()