在Python中使用ElementTree创建多级继承结构XML树

Vineel Phatak, 520, NOBODY
Ajay Joshi, 250, Vineel Phatak
Abhishek Chauhan, 120, Ajay Joshi
Jayesh Godse, 500, NOBODY
Vijaya Mundada, 60, Abhishek Chauhan
Shital Tuteja, 45, Jayesh Godse
Rajan Gawli, 700, Vineel Phatak
Zeba Khan, 300, Jayesh Godse
Chaitali Sood, 100, Zeba Khan
Sheila Rodrigues, 35, Vineel Phatak

<company> <Vineel Phatak> <Ajay Joshi> <Abhishek Chauhan> <Vijaya Mundada /> </Abhishek Chauhan> </Ajay Joshi> <Rajan Gawli /> <Sheila Rodrigues /> </Vineel Phatak> <Jayesh Godse> <Shital Tuteja /> <Zeba Khan> <Chaitali Sood /> </Zeba Khan> </Jayesh Godse> </company>

# Find last employee of the last introduced CEO
import xml.etree.ElementTree as ET

# Read every "name, salary, manager" record from the input file.
with open('input.txt', 'r') as inD:
    data = inD.readlines()

# Create one element per employee directly under the root and keep a
# reference to each of them for the manager lookup below.
all_element = []
company = ET.Element('Company')
ceos = []
for line in data:
    fields = line.strip().split(',')
    if fields[2].strip() == 'NOBODY':
        ceos.append(fields[0])
    all_element.append(ET.SubElement(company, fields[0]))


def findChilds(name, emp):
    """Add a child tagged ``name`` under each registered element tagged ``emp``."""
    for candidate in all_element:
        if emp == candidate.tag:
            # NOTE: ``name`` is rebound to the new element here, so a second
            # matching candidate would receive that element as its tag.
            name = ET.SubElement(candidate, name)


# An employee without a manager (a CEO) is appended to the root once more;
# everybody else is added beneath the element of their manager.
for line in data:
    fields = line.strip().split(',')
    if fields[2].strip() == 'NOBODY':
        ET.SubElement(company, fields[0])
    else:
        findChilds(fields[0].strip(), fields[2].strip())

ET.dump(company)

<Company><Vineel Phatak><Ajay Joshi /><Rajan Gawli /><Sheila Rodrigues /></Vineel Phatak><Ajay Joshi><Abhishek Chauhan /></Ajay Joshi><Abhishek Chauhan><Vijaya Mundada /></Abhishek Chauhan><Jayesh Godse><Shital Tuteja /><Zeba Khan /></Jayesh Godse><Vijaya Mundada /><Shital Tuteja /><Rajan Gawli /><Zeba Khan><Chaitali Sood /></Zeba Khan><Chaitali Sood /><Sheila Rodrigues /><Vineel Phatak /><Jayesh Godse /></Company>

1条回答

网友

1楼 · 发布于 2024-09-27 21:26:24

在给出我的示例之前，先就 XML 结构提一点建议：创建 XML 结构时，最好用“对象类别”（例如 employee）作为元素的标签名，并把它的各项“属性”（如姓名和薪水）存储为 XML 属性：
<employee name="Vineel Phatak" salary="520"/>
而不是：
<Vineel Phatak/>
这将使解析变得更容易，并为以后扩展格式提供更大的灵活性；此外，含有空格的名称（如 Vineel Phatak）本身也不是合法的 XML 元素名。

我的例子

您的问题的示例实现：

import csv
from dataclasses import dataclass, field
import xml.etree.ElementTree as ET


@dataclass
class Employee:
    """A single employee record together with its reporting links.

    ``subordinates`` defaults to a fresh empty list for every instance, so
    a record can be created before any of its reports are known and no two
    records ever share the same list object.
    """

    linenumber: int  # position of the record in the input; used to order records
    name: str
    salary: str  # kept as text so it can be written as an XML attribute as-is
    manager_name: str  # name of the manager this employee reports to
    subordinates: list = field(default_factory=list)  # Employee records reporting to this one


employees = {}  # maps each employee name to its Employee record

# Load employees. The csv module asks for files to be opened with
# newline='' so that it can handle line endings itself.
with open('company.csv', newline='') as csvfile:
    reader = csv.reader(csvfile)
    for linenumber, row in enumerate(reader):
        cells = [value.strip() for value in row]
        if not any(cells):
            # Blank or whitespace-only lines carry no record; without this
            # guard the three-way unpacking below would raise ValueError.
            continue
        name, salary, manager_name = cells
        # A later row with the same name replaces the earlier record.
        employees[name] = Employee(linenumber, name, salary, manager_name, [])


# Connect every employee to the record of their manager. Employees whose
# manager is 'NOBODY' have nobody above them: they are gathered in `ceos`
# and serve as the roots when the XML tree is built afterwards.
ceos = []
for employee in employees.values():
    if employee.manager_name != 'NOBODY':
        # look the manager up by name and register this employee with them
        employees[employee.manager_name].subordinates.append(employee)
        continue
    ceos.append(employee)

# Root element of the XML document; employee elements are nested inside it.
companyelement = ET.Element("company")

def add_employees_to_xml_element(xmlelement, employees):
    """Append one ``<employee>`` child per record, recursing into subordinates.

    Args:
        xmlelement: Element that receives the new children.
        employees: Iterable of records exposing ``name``, ``salary`` and
            ``subordinates``.
    """
    for record in employees:
        attributes = {"name": record.name, "salary": record.salary}
        node = ET.Element("employee", attributes)
        xmlelement.append(node)
        # The subordinates of this record become children of its own node.
        add_employees_to_xml_element(node, record.subordinates)


# Build the tree below the root element, starting from the CEOs, and then
# print the resulting XML.
add_employees_to_xml_element(companyelement, ceos)
ET.dump(companyelement)

# Key function for ordering employee records by their position in the input.
def linenumber_key(ceo):
    """Return the line number stored on the given record."""
    return ceo.linenumber


# The CEO with the highest line number is the one that was entered last.
# NOTE(review): max() raises ValueError when `ceos` is empty.
last_entered_ceo = max(ceos, key=linenumber_key)
print(f"Last entered CEO: {last_entered_ceo.name}")

# find the last entered (in)direct subordinate of an employee
def find_last_entered_subordinate(employee, current_last=None):
    """Return the most recently entered (in)direct subordinate of *employee*.

    The whole subtree below *employee* is walked depth-first and the record
    with the highest ``linenumber`` is kept.

    Args:
        employee: Record whose ``subordinates`` are searched. Every record in
            the subtree must expose ``linenumber`` and ``subordinates``.
        current_last: Best candidate found so far. Callers normally leave it
            out; the recursion passes it along.

    Returns:
        The subordinate with the highest line number, ``current_last`` when
        nothing in the subtree has a higher one, or ``None`` when there are
        no subordinates and no candidate was supplied.
    """
    for subordinate in employee.subordinates:
        # Test for None explicitly so that a record which happens to be
        # falsy is never mistaken for "no candidate yet". On equal line
        # numbers the earlier candidate is kept.
        if (current_last is None
                or subordinate.linenumber > current_last.linenumber):
            current_last = subordinate
        # recursive: traverse the subordinate's own subordinates
        current_last = find_last_entered_subordinate(subordinate, current_last)
    return current_last


last_employee = find_last_entered_subordinate(last_entered_ceo)
if last_employee is None:
    # The search yields None for a CEO without any subordinates; reading
    # .name on it would raise AttributeError.
    print(f"Last CEO {last_entered_ceo.name} has no subordinates")
else:
    print(f"Last added subordinate of last CEO: {last_employee.name}")

我把练习分为以下几个部分：

将 CSV 文件中的员工加载到字典中，便于（也更快地）之后按姓名查找员工。我还保存了每位员工所在的行号，用于回答你后面的问题（找出最后录入的 CEO 及其下属）
将员工与其下属关联起来。由于经理可能排在其下属之后，这一步不能与第一步合并。每位员工都有一个下属列表，而 CEO 则保存在一个单独的“根”列表中
使用元素树和遍历上述创建的CEO列表的递归函数创建xml
查找最后录入的 CEO。我们已经有了一个 CEO 列表，但它是通过遍历字典得到的（在 Python 3.7 之前，字典不保证遍历顺序与添加顺序一致），所以我没有直接取最后一个元素，而是找出行号最大的 CEO
查找最后录入的 CEO 名下最后录入的（直接或间接）下属。与上一步类似，这次我使用递归函数按行号找出该员工

结果xml:

<company>
    <employee name="Vineel Phatak" salary="520">
        <employee name="Ajay Joshi" salary="250">
            <employee name="Abhishek Chauhan" salary="120">
                <employee name="Vijaya Mundada" salary="60"/>
            </employee>
        </employee>
        <employee name="Rajan Gawli" salary="700"/>
        <employee name="Sheila Rodrigues" salary="35"/>
    </employee>
    <employee name="Jayesh Godse" salary="500">
        <employee name="Shital Tuteja" salary="45"/>
        <employee name="Zeba Khan" salary="300">
            <employee name="Chaitali Sood" salary="100"/>
        </employee>
    </employee>
</company>

我的例子

相关问题更多 >

编程相关推荐

热门问题

热门文章