将txt文件转为xml文件以适配图像标注工具labelimg或Pascal VOC XML 格式

labelImg

🎉 超级实用！LabelImg，图像标注神器，现在加入Label Studio社区，享受多模态数据标注新体验！🚀 简单易用，支持XML、YOLO和CreateML格式，适用于ImageNet等项目。不再单独维护，立即尝试Label Studio，安装一键到位，更灵活，功能更强大！👇 安装即刻开始：pip3 install labelImg，或访问<https://github.com/heartexlabs/label-studio> 获取源码构建。一起探索数据标注的新边界！👨‍💻👩‍💻【此简介由AI生成】

项目地址：https://gitcode.com/gh_mirrors/la/labelImg

免费下载资源

Anymake

5305人浏览 · 2018-07-06 15:45:06

Anymake · 2018-07-06 15:45:06 发布

labelimg作为图像领域目标检测、图像语义分割等领域常见的标注工具，输出的数据格式是Pascal VOC，实际工作中，我们经常需要把其他标注格式为txt的文件转为VOC的xml文件格式，下面的代码提供txt转VOC格式的xml文件的功能。

from xml.dom.minidom import Document
import os
import os.path
from PIL import Image

ann_path = "/Users/label_result.txt"
img_path = "/Users/"
xml_path = "/Users/"

if not os.path.exists(xml_path):
    os.mkdir(xml_path)

def writeXml(tmp, imgname,imgpath, w, h, label_list, wxml, attributes_list):
    doc = Document()
    #owner
    annotation = doc.createElement('annotation')
    doc.appendChild(annotation)
    #owner
    folder = doc.createElement('folder')
    annotation.appendChild(folder)
    folder_txt = doc.createTextNode("R_dataset")
    folder.appendChild(folder_txt)

    filename = doc.createElement('filename')
    annotation.appendChild(filename)
    filename_txt = doc.createTextNode(imgname)
    filename.appendChild(filename_txt)

    path = doc.createElement('path')
    annotation.appendChild(path)
    path_txt = doc.createTextNode(imgpath)
    path.appendChild(path_txt)
    #ones#
    source = doc.createElement('source')
    annotation.appendChild(source)

    database = doc.createElement('database')
    source.appendChild(database)
    database_txt = doc.createTextNode("The R Database")
    database.appendChild(database_txt)
    #onee#
    #twos#
    size = doc.createElement('size')
    annotation.appendChild(size)

    width = doc.createElement('width')
    size.appendChild(width)
    width_txt = doc.createTextNode(str(w))
    width.appendChild(width_txt)

    height = doc.createElement('height')
    size.appendChild(height)
    height_txt = doc.createTextNode(str(h))
    height.appendChild(height_txt)

    depth = doc.createElement('depth')
    size.appendChild(depth)
    depth_txt = doc.createTextNode("3")
    depth.appendChild(depth_txt)
    #twoe#
    segmented = doc.createElement('segmented')
    annotation.appendChild(segmented)
    segmented_txt = doc.createTextNode("0")
    segmented.appendChild(segmented_txt)

    # attributes
    attributes = doc.createElement("attributes")
    annotation.appendChild(attributes)

    for i in range(0,len(attributes_list)):
        #threes#
        attr_new = doc.createElement(attributes_list[i])
        attributes.appendChild(attr_new)
        attr_new_txt = doc.createTextNode(label_list[i])
        attr_new.appendChild(attr_new_txt)
        #threee#
    with open(wxml, "w") as f:
        f.write(doc.toprettyxml(indent = '\t', encoding='utf-8')) 
    f.close()

    # tempfile = tmp + "test.xml"
    # with open(tempfile, "w") as f:
    #     f.write(doc.toprettyxml(indent = '\t', encoding='utf-8'))

    # rewrite = open(tempfile, "r")
    # lines = rewrite.read().split('\n')
    # newlines = lines[1:len(lines)-1]

    # fw = open(wxml, "w")
    # for i in range(0, len(newlines)):
    #     fw.write(newlines[i] + '\n')

    # fw.close()
    # rewrite.close()
    # # os.remove(tempfile)
    return

attributes_list = [
    'Female',
    'AgeLess16',
    'Age17-30',
    'Age31-45',
    'BodyFat',
    'BodyNormal',
    'BodyThin'  
]

# temp = "/Users/data/temp"
# if not os.path.exists(temp):
#    os.mkdir(temp)

f = open(ann_path, 'r')
txt_list = f.readlines()
f.close()
im_name_list = []

for line in txt_list:
    line = line.strip()
    line_split = line.split(' ')
    img_name = line_split[0].split('/')[-1]
    im_name_list.append(img_name)
    label_list = []
    for j in range(1, len(line_split)):
        label_list.append(line_split[j])
    fileimgpath = os.path.join(img_path, img_name)
    im=Image.open(fileimgpath)  
    width= int(im.size[0])
    height= int(im.size[1])
    # print label_list
    savename = os.path.join(xml_path , img_name.split('.')[0] + '.xml')
    writeXml(temp, img_name,fileimgpath, width, height, label_list, savename,attributes_list)
# os.rmdir(temp)

GitHub 加速计划 / la / labelImg

下载

最近提交(Master分支：4 个月前 )

b33f965b Adds information about Label Studio community to welcome LabelImg users 3 年前

2d5537ba 3 年前

AtomGit开源社区

AtomGit 是由开放原子开源基金会联合 CSDN 等生态伙伴共同推出的新一代开源与人工智能协作平台。平台坚持“开放、中立、公益”的理念，把代码托管、模型共享、数据集托管、智能体开发体验和算力服务整合在一起，为开发者提供从开发、训练到部署的一站式体验。

更多推荐

1.8B 体积、33 种语言互译｜腾讯混元 HY-MT1.5-1.8B 多语言机器翻译模型上线

在跨语言交流日益频繁的今天，阅读外语菜单、处理多语言邮件、与不同语言背景的人沟通，已经成为很多人日常工作与生活的一部分。过去，这类需求往往依赖联网翻译工具，而如今，—— 一部设备即可支持的相互翻译。当 AI 不再只是“逐字直译”，而是开始理解语境、风格与语言之间的细微差异，机器翻译就真正具备了今天为大家介绍一款高质量、多语言、支持端侧部署的机器翻译模型 ——，现已上线 AtomGit AI 社区，