日常开发中,我们经常需要把文件中的数据写入缓存。用 Python 读取文件方便快捷,而且 Python 提供了非常好用的 API 来连接 Redis。本例使用 rediscluster 包连接 Redis 集群,并通过 pipeline(管道)批量写入文件内容。
# encoding: utf-8
from rediscluster import StrictRedisCluster
import sys
import os
import datetime
# redis_nodes = [{"host": "10.80.23.175", "port": 7000},
# {"host": "10.80.23.175", "port": 7001},
# {"host": "10.80.24.175", "port": 7000},
# {"host": "10.80.24.175", "port": 7001},
# {"host": "10.80.25.175", "port": 7000},
# {"host": "10.80.25.175", "port": 7001}
# ]
def redis_cluster(startup_nodes=None):
    """Create the Redis cluster client used by the loader.

    Args:
        startup_nodes: Optional list of ``{"host": ..., "port": ...}`` dicts
            handed to ``StrictRedisCluster``. When omitted, the six nodes
            hard-coded below are used.

    Returns:
        The ``StrictRedisCluster`` instance built from those nodes.

    Exits the process with status 1 (after reporting the cause on stderr)
    if the client cannot be created.
    """
    if startup_nodes is None:
        startup_nodes = [
            {"host": "10.80.23.175", "port": 7000},
            {"host": "10.80.23.175", "port": 7001},
            {"host": "10.80.24.175", "port": 7000},
            {"host": "10.80.24.175", "port": 7001},
            {"host": "10.80.25.175", "port": 7000},
            {"host": "10.80.25.175", "port": 7001},
        ]
    try:
        return StrictRedisCluster(startup_nodes=startup_nodes,
                                  skip_full_coverage_check=True)
    except Exception as e:
        # Script-level boundary: any failure here is fatal, but report the
        # underlying cause instead of hiding it behind a fixed message.
        sys.stderr.write("Connect Error! %s\n" % e)
        sys.exit(1)
def to_redis(redis_conn1, file_name, batch_size=5000):
    """Load a tab-separated file into Redis lists through a pipeline.

    Each usable line has the form ``key<TAB>value[<TAB>...]``; the second
    field is LPUSHed onto the list stored at the first field. Fields after
    the second are ignored.

    Args:
        redis_conn1: Object exposing ``pipeline()``; the returned pipeline
            must provide ``lpush(key, value)`` and ``execute()``.
        file_name: Path of the text file to read.
        batch_size: Number of queued commands after which the pipeline is
            flushed with ``execute()``.

    Blank lines and lines without a tab are skipped.
    """
    pipe = redis_conn1.pipeline()
    pending = 0   # commands queued since the last execute()
    batches = 0   # number of full batches flushed so far
    with open(file_name, 'r') as file_to_read:
        # Iterate the file object itself so that end-of-file is detected by
        # the iterator; an empty line in the middle of the file must not be
        # mistaken for EOF.
        for raw_line in file_to_read:
            fields = raw_line.rstrip("\n").split("\t")
            if len(fields) < 2:
                # Blank or malformed line: there is no value to push.
                continue
            pipe.lpush(fields[0], fields[1])
            pending += 1
            if pending >= batch_size:
                pipe.execute()
                pending = 0
                batches += 1
                print("execute insert! count is %d" % batches)
    # Flush whatever is left over from the last, partial batch.
    if pending:
        pipe.execute()
def read_file(path, conn=None):
    """Load a single file, or every file under a directory tree, into Redis.

    Args:
        path: Path of a regular file, or of a directory that is walked
            recursively with ``os.walk``.
        conn: Redis connection handed to ``to_redis``. When omitted, the
            module-level ``redis_conn`` is used.
    """
    if conn is None:
        # Fall back to the connection stored in the module-level name.
        conn = redis_conn
    if os.path.isfile(path):
        print("start execute file %s" % path)
        # to_redis needs the connection as its first argument.
        to_redis(conn, path)
        return
    for root, dirs, files in os.walk(path):
        print('files:', files)  # all non-directory entries directly under root
        for fileName in files:
            all_name = os.path.join(root, fileName)
            print("start execute file %s" % all_name)
            to_redis(conn, all_name)
if __name__ == "__main__":
    # sys.argv[0] is this script itself; the file or directory to load is
    # the first real command-line argument.
    if len(sys.argv) < 2:
        sys.stderr.write("usage: python %s <file-or-directory>\n" % sys.argv[0])
        sys.exit(1)
    file_paths = sys.argv[1]
    start_time = datetime.datetime.now()
    # Kept as a module-level name: read_file() looks the connection up here.
    redis_conn = redis_cluster()
    read_file(file_paths)
    end_time = datetime.datetime.now()
    # total_seconds() covers the whole interval; the .seconds attribute
    # alone would drop any whole days from the elapsed time.
    print("use times is %d " % (end_time - start_time).total_seconds())
使用时,需要把待导入的文件(或目录)路径作为命令行参数传入;文件中每一行的格式为“key<Tab>value”。
例如,将 /data/a.log 中的数据导入 Redis:
python RedisFIleToRedis.py /data/a.log