MENU

Python用于清理elasticsearch脚本~

February 25, 2020 • Linux运维工作,Python蟒蛇

用于清理elasticsearch数据,放着自己记录看一下。第一次用yield
#!/usr/bin/env python3
# -*- coding: utf-8 -*-
''' elasticsearch clean '''
__author__ = 'jiangjw'

import requests
import heapq
import traceback
import datetime


class Esclean(object):
    def __init__(self, host, port):
        self.host = host
        self.port = str(port)

    def setting(self):
        self.urlName = 'http://' + self.host + ":" + self.port + '/_cat/indices'
        self.urlDel = 'http://' + self.host + ':' + self.port + '/'

    def getName(self):
        try:
            dataResponse = requests.get(self.urlName)
            dataResponse.raise_for_status()
            dataName = dataResponse.text
            # 循环每一行,再通过split截取需要的部分,写入列表
            for line in dataName.splitlines():
                name = line.split()[2]
                yield name
        except:
            traceback.print_exc()

    def filterName(self):
        today = datetime.date.today()
        todayNumber = int(str(today).replace('-', ""))
        self.filebeat = {}
        for name in self.getName():
            # 截取最后一截,用于比对
            nameDate = name.replace('.', '-').split('-')[-3:]
            nameDate = ''.join(nameDate)
            if nameDate.isdigit():
                nameDate = int(nameDate)
                if nameDate > 99999999:
                    nameDate = str(nameDate)[-6:]
                    self.filebeat[nameDate] = name
                    continue
                if nameDate + 2 <= todayNumber:
                    delName = name
                    yield delName

    def filterBeat(self):
        beatName = heapq.nlargest(1, self.filebeat)
        for i in self.filebeat:
            if i not in beatName:
                yield self.filebeat.get(i)

    def deleteName(self):
        for u in self.filterName():
            try:
                deleteUrl = self.urlDel + u
                response = requests.delete(url=deleteUrl)
                response.raise_for_status()
            except:
                traceback.print_exc()

        for f in self.filterBeat():
            try:
                deleteUrl = self.urlDel + f
                response = requests.delete(url=deleteUrl)
                response.raise_for_status()
            except:
                traceback.print_exc()


def main():
    start = datetime.datetime.now()
    host = '192.168.110.174'
    port = 9200
    es = Esclean(host=host, port=port)
    es.setting()
    es.deleteName()
    end = datetime.datetime.now()
    print("{}运行完成,脚本共耗时:{}s".format(start, (end - start).seconds))


if __name__ == '__main__':
    main()
Last Modified: March 30, 2023