Read and parse XML from construction systems - P6 schedules, BSDD exports, IFC-XML, COBie-XML. Convert to pandas DataFrames.
数据来源:ClawHub。 在 ClawSkills 查看
选择你使用的 Agent
方法一:命令行安装(推荐)
推荐(无需提前安装 clawhub)
npx clawhub@latest --dir ~/.claude/skills install xml-reader或使用 clawhub CLI(需提前安装)
clawhub --dir ~/.claude/skills install xml-reader⚠️ 需要 Node.js 18+,没有 Node?请使用下方方法二直接下载 ZIP。 安装 Node.js →
方法二:手动下载安装(无需 Node)
下载 ZIP,解压后将文件夹放到以下路径,重启 Agent 即可:
安装路径
~/.claude/skills/xml-reader/💡解压后将文件夹放到上方路径,重启 Agent 即可生效
--- name: "xml-reader" description: "Read and parse XML from construction systems - P6 schedules, BSDD exports, IFC-XML, COBie-XML. Convert to pandas DataFrames." homepage: "https://datadrivenconstruction.io" metadata: {"openclaw": {"emoji": "🏷️", "os": ["darwin", "linux", "win32"], "homepage": "https://datadrivenconstruction.io", "requires": {"bins": ["python3"]}}} ---
XML is used in construction for P6 schedules (XER), IFC-XML, COBie-XML, and buildingSMART Data Dictionary exports. This skill parses XML and converts to structured DataFrames.
import xml.etree.ElementTree as ET
import pandas as pd
from typing import Dict, Any, List, Optional, Union
from dataclasses import dataclass
from pathlib import Path
import re
@dataclass
class XMLElement:
"""Parsed XML element."""
tag: str
attributes: Dict[str, str]
text: Optional[str]
children: List['XMLElement']
class ConstructionXMLReader:
"""Parse XML from construction systems."""
def __init__(self):
self.namespaces: Dict[str, str] = {}
def parse_file(self, file_path: str) -> ET.Element:
"""Parse XML file and return root element."""
tree = ET.parse(file_path)
root = tree.getroot()
# Extract namespaces
self._extract_namespaces(root)
return root
def parse_string(self, xml_string: str) -> ET.Element:
"""Parse XML from string."""
root = ET.fromstring(xml_string)
self._extract_namespaces(root)
return root
def _extract_namespaces(self, root: ET.Element):
"""Extract namespace mappings."""
# Find namespace declarations
for attr, value in root.attrib.items():
if attr.startswith('{'):
ns = attr[1:attr.index('}')]
self.namespaces[root.tag.split('}')[0][1:]] = ns
def find_elements(self, root: ET.Element,
tag: str,
namespace: str = None) -> List[ET.Element]:
"""Find all elements with given tag."""
if namespace:
tag = f"{{{namespace}}}{tag}"
return root.findall(f".//{tag}")
def element_to_dict(self, element: ET.Element,
include_children: bool = True) -> Dict[str, Any]:
"""Convert element to dictionary."""
result = {
'_tag': element.tag.split('}')[-1] if '}' in element.tag else element.tag,
'_text': element.text.strip() if element.text else None,
**element.attrib
}
if include_children:
for child in element:
child_tag = child.tag.split('}')[-1] if '}' in child.tag else child.tag
if child_tag in result:
# Multiple children with same tag - make list
if not isinstance(result[child_tag], list):
result[child_tag] = [result[child_tag]]
result[child_tag].append(self.element_to_dict(child))
else:
result[child_tag] = self.element_to_dict(child)
return result
def elements_to_dataframe(self, elements: List[ET.Element]) -> pd.DataFrame:
"""Convert list of elements to DataFrame."""
records = []
for elem in elements:
record = {'_tag': elem.tag.split('}')[-1]}
record.update(elem.attrib)
# Get direct text content
if elem.text and elem.text.strip():
record['_text'] = elem.text.strip()
# Get child values
for child in elem:
child_tag = child.tag.split('}')[-1]
if child.text and child.text.strip():
record[child_tag] = child.text.strip()
# Also get child attributes
for attr, val in child.attrib.items():
record[f"{child_tag}_{attr}"] = val
records.append(record)
return pd.DataFrame(records)
def flatten_xml(self, root: ET.Element,
target_tag: str = None) -> pd.DataFrame:
"""Flatten XML to DataFrame."""
if target_tag:
elements = self.find_elements(root, target_tag)
else:
elements = list(root)
return self.elements_to_dataframe(elements)
class P6XMLReader(ConstructionXMLReader):
"""Reader for Primavera P6 XML exports."""
def parse_activities(self, root: ET.Element) -> pd.DataFrame:
"""Parse activities from P6 XML."""
activities = self.find_elements(root, 'Activity')
return self.elements_to_dataframe(activities)
def parse_resources(self, root: ET.Element) -> pd.DataFrame:
"""Parse resources from P6 XML."""
resources = self.find_elements(root, 'Resource')
return self.elements_to_dataframe(resources)
def parse_wbs(self, root: ET.Element) -> pd.DataFrame:
"""Parse WBS from P6 XML."""
wbs = self.find_elements(root, 'WBS')
return self.elements_to_dataframe(wbs)
def parse_full_schedule(self, file_path: str) -> Dict[str, pd.DataFrame]:
"""Parse complete P6 schedule."""
root = self.parse_file(file_path)
return {
'activities': self.parse_activities(root),
'resources': self.parse_resources(root),
'wbs': self.parse_wbs(root)
}
class IFCXMLReader(ConstructionXMLReader):
"""Reader for IFC-XML files."""
def parse_entities(self, root: ET.Element) -> pd.DataFrame:
"""Parse IFC entities."""
# Find all Ifc* elements
all_entities = []
for elem in root.iter():
if elem.tag.startswith('Ifc'):
all_entities.append(elem)
return self.elements_to_dataframe(all_entities)
def get_entity_types(self, root: ET.Element) -> Dict[str, int]:
"""Count entity types."""
counts = {}
for elem in root.iter():
tag = elem.tag
if tag.startswith('Ifc'):
counts[tag] = counts.get(tag, 0) + 1
return counts
class COBieXMLReader(ConstructionXMLReader):
"""Reader for COBie XML files."""
COBIE_SHEETS = ['Facility', 'Floor', 'Space', 'Zone', 'Type',
'Component', 'System', 'Assembly', 'Connection',
'Spare', 'Resource', 'Job', 'Document', 'Attribute']
def parse_cobie(self, file_path: str) -> Dict[str, pd.DataFrame]:
"""Parse all COBie sheets."""
root = self.parse_file(file_path)
result = {}
for sheet in self.COBIE_SHEETS:
elements = self.find_elements(root, sheet)
if elements:
result[sheet] = self.elements_to_dataframe(elements)
return result
class BSDDXMLReader(ConstructionXMLReader):
"""Reader for buildingSMART Data Dictionary exports."""
def parse_classifications(self, root: ET.Element) -> pd.DataFrame:
"""Parse classification items."""
items = self.find_elements(root, 'Classification')
return self.elements_to_dataframe(items)
def parse_properties(self, root: ET.Element) -> pd.DataFrame:
"""Parse property definitions."""
props = self.find_elements(root, 'Property')
return self.elements_to_dataframe(props)
reader = ConstructionXMLReader()
# Parse XML file
root = reader.parse_file("schedule.xml")
# Find specific elements
activities = reader.find_elements(root, "Activity")
print(f"Found {len(activities)} activities")
# Convert to DataFrame
df = reader.elements_to_dataframe(activities)
p6_reader = P6XMLReader()
...安装 Xml Reader 后,可以对 AI 说这些话来触发它
Help me get started with Xml Reader
Explains what Xml Reader does, walks through the setup, and runs a quick demo based on your current project
Use Xml Reader to read and parse XML from construction systems - P6 schedules, BSDD e...
Invokes Xml Reader with the right parameters and returns the result directly in the conversation
What can I do with Xml Reader in my documents & notes workflow?
Lists the top use cases for Xml Reader, with example commands for each scenario
将技能文件夹放到 ~/.claude/skills/xml-reader/ 目录(个人级,所有项目可用),或 .claude/skills/xml-reader/(项目级)。重启 AI 客户端后,用 /xml-reader 主动调用,或让 AI 根据上下文自动发现并使用。
Xml Reader 支持 Claude、Cursor、OpenClaw,可与这些 AI 平台无缝集成,扩展其能力。
Xml Reader 可免费安装使用。请查阅仓库了解许可证信息。
Read and parse XML from construction systems - P6 schedules, BSDD exports, IFC-XML, COBie-XML. Convert to pandas DataFrames.
Xml Reader 属于「Documents & Notes」分类,该分类的技能帮助 AI 智能体在此领域执行专业任务。
Automate my documents & notes tasks using Xml Reader
Identifies repetitive steps in your workflow and sets up Xml Reader to handle them automatically