将元素添加到标头

# xml.etree.cElementTree was removed in Python 3.9; ElementTree is the
# supported module. The historical ``cET`` alias is kept so existing
# references to it keep working.
import xml.etree.ElementTree as cET
from pathlib import Path

import pandas as pd


def phones_to_df(fname):
    """Parse one XML file into a DataFrame with one row per ``<Phones>`` element.

    Each direct child of a ``<Phones>`` element becomes a column named after
    the child's tag and holding the child's text. When the same tag occurs
    more than once inside one ``<Phones>`` element, the last occurrence wins.
    Every attribute of the ``<nuk>`` child is added as a ``nuk_<attribute>``
    column.

    Args:
        fname: Path (or file object) accepted by ``ElementTree.parse``.

    Returns:
        A ``pandas.DataFrame`` with one row per ``<Phones>`` element found
        directly under the document root.
    """
    tree = cET.parse(fname)
    rows = []
    for phone in tree.iterfind('Phones'):
        row = {el.tag: el.text for el in phone}
        nuk = phone.find('nuk')
        # Compare against None explicitly: a childless Element is falsy, and
        # a record without <nuk> should simply contribute no nuk_* columns
        # instead of raising AttributeError.
        if nuk is not None:
            row.update({f'nuk_{k}': v for k, v in nuk.items()})
        rows.append(row)
    return pd.DataFrame(rows)


if __name__ == '__main__':
    # Collect every XML file in the input folder and merge them into one CSV.
    xmls = list(Path('C:/Users/Desktop/Original/test').glob('*.xml'))
    df = pd.concat([phones_to_df(xml) for xml in xmls])
    df.to_csv("C:/Users/Desktop/Original/all.csv")

<Data xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xmlns:xsd="http://www.w3.org/2001/XMLSchema"> <Phones> <Date /> <Prog /> <Box /> <Feature /> <PR>1231</PR> <Set>234234</Set> <FD>23423</FD> <Reno>454</Reno> <Simple>dfasd</Simple> <Nr /> <gt>6070106091</gt> <Reno>1233</Reno> <QW>3234</QW> <ER /> <VR /> <Use /> <Dar>sdfsd</Dar> <age /> <name1>sdfsfdfs</name1> <Sys>Itone</Sys> <aac>2014</aac> <time>02:00</time> <nuk name="This is some text" text_g="asadsdas" text_h="2">fsdfsfd3432fdf</nuk> </Phones> </Data>

1条回答

网友

1楼 · 发布于 2024-09-24 22:25:13

如果Phones中的节点是唯一的，您只需调整正在构建的字典以创建数据帧，并添加所需的额外列：

def phones_to_df(fname):
    """Build a DataFrame from the ``<Phones>`` elements of an XML file.

    Each row starts with a ``PLAN`` value formed by joining the text of the
    first ``<PR>`` and first ``<Reno>`` children with an underscore. It is
    followed by one column per child tag (holding the child's text) and one
    ``nuk_<attribute>`` column per attribute of the ``<nuk>`` child.
    """
    records = []
    for entry in cET.parse(fname).iterfind('Phones'):
        # PLAN is inserted first so it becomes the leading column.
        record = {'PLAN': f'{entry.find("PR").text}_{entry.find("Reno").text}'}
        for child in entry:
            record[child.tag] = child.text
        for attr, value in entry.find('nuk').items():
            record[f'nuk_{attr}'] = value
        records.append(record)
    return pd.DataFrame(records)

相关问题更多 >

编程相关推荐

热门问题

热门文章