Files
bpf-developer-tutorial/scripts/generate_toc.py
github-actions[bot] 342acab9af docs: Update README and SUMMARY files to include Intel NPU kernel driver lessons and cgroup policy control
feat: Enhance TOC generation script to include non-numbered directories with .config files
chore: Add .config file for cgroup-based policy control
2026-01-31 05:55:22 +00:00

330 lines
15 KiB
Python

import os
import re
# Define a function to walk through the directory and generate the TOC structure
def generate_toc(base_dir, project_root, output_file_dir):
toc = "## Table of Contents\n\n"
section_headers = {
"Basic": "### Getting Started Examples\n\nThis section contains simple eBPF program examples and introductions. It primarily utilizes the `eunomia-bpf` framework to simplify development and introduces the basic usage and development process of eBPF.\n\n",
"Advance": "### Advanced Documents and Examples\n\nWe start to build complete eBPF projects mainly based on `libbpf` and combine them with various application scenarios for practical use.\n\n",
"Depth": "### In-Depth Topics\n\nThis section covers advanced topics related to eBPF, including using eBPF programs on Android, possible attacks and defenses using eBPF programs, and complex tracing. Combining the user-mode and kernel-mode aspects of eBPF can bring great power (as well as security risks).\n\n"
}
subsection_titles = {
"Android": "\n\nAndroid:\n\n",
"GPU": "\n\nGPU:\n\n",
"Scheduler": "\n\nScheduler:\n\n",
"Networking": "\n\nNetworking:\n\n",
"Tracing": "\n\nTracing:\n\n",
"Security": "\n\nSecurity:\n\n",
"Features": "\n\nFeatures:\n\n",
"Other": "\nOther:\n\n"
}
subsection_order = ['GPU', 'Scheduler', 'Networking', 'Tracing', 'Security', 'Features', 'Other', 'Android']
# To ensure numeric sorting of directories
def sort_key(directory_name):
return list(map(int, re.findall(r'\d+', directory_name)))
sections = {} # {section_level: {subsection_type: [lessons]}}
# Collect all directories including subdirectories
all_dirs = []
for item in os.listdir(base_dir):
item_path = os.path.join(base_dir, item)
if os.path.isdir(item_path):
# Add numbered directories directly
if re.match(r'^\d+', item):
all_dirs.append(item)
# Also add non-numbered directories that have .config file
elif os.path.exists(os.path.join(item_path, ".config")):
all_dirs.append(item)
# Also scan subdirectories (like features/, xpu/)
else:
for subitem in os.listdir(item_path):
subitem_path = os.path.join(item_path, subitem)
if os.path.isdir(subitem_path):
all_dirs.append(os.path.join(item, subitem))
# Sort directories properly by numeric order (non-numeric dirs go to end)
all_dirs = sorted(all_dirs, key=lambda d: sort_key(d) if re.search(r'\d+', d) else [999999])
# Loop over the sorted directories
for directory in all_dirs:
lesson_path = os.path.join(base_dir, directory)
config_path = os.path.join(lesson_path, ".config")
readme_path = os.path.join(lesson_path, "README.md")
if os.path.exists(config_path) and os.path.exists(readme_path):
# Read the .config file for 'level', 'type', and 'desc'
with open(config_path, 'r') as config_file:
config_lines = config_file.readlines()
level = None
lesson_type = None
desc = None
for line in config_lines:
if line.startswith("level="):
level = line.split("=",1)[1].strip()
elif line.startswith("type="):
lesson_type = line.split("=",1)[1].strip()
elif line.startswith("desc="):
desc = line.split("=",1)[1].strip()
# Extract the first markdown title in README_en.md
with open(readme_path, 'r') as readme_file:
first_title = None
for line in readme_file:
if line.startswith("#"):
first_title = line.strip().lstrip("#").strip()
break
# If title starts with "eBPF", remove the part before the colon
if first_title and first_title.startswith("eBPF"):
if ":" in first_title:
first_title = first_title.split(":", 1)[1].strip()
# Get the relative path for the lesson (relative to the output file's directory)
lesson_rel_path = os.path.relpath(readme_path, output_file_dir)
# Prepare lesson data
# Handle both numbered lessons (e.g., "12-profile") and named lessons (e.g., "features/bpf_arena")
if '-' in os.path.basename(directory):
lesson_number = directory.split('-')[0]
lesson_name = directory.split('-', 1)[1]
link_text = f"lesson {lesson_number}-{lesson_name}"
else:
# For non-numbered directories, use the full path as name
link_text = directory.replace('/', ' ')
link = f"{lesson_rel_path}"
# Use description if available, else use first title
lesson_desc = desc if desc else first_title
lesson_entry = {
'link_text': link_text,
'link': link,
'desc': lesson_desc
}
# Organize lessons into sections and subsections
sections.setdefault(level, {}).setdefault(lesson_type, []).append(lesson_entry)
# Now, output the TOC in the desired order
section_order = ['Basic', 'Advance', 'Depth']
for level in section_order:
if level in sections:
toc += section_headers.get(level, "")
# For Basic and Advance sections, no subsections
if level != 'Depth':
for lesson in sum(sections[level].values(), []): # Flatten the list
toc += f"- [{lesson['link_text']}]({lesson['link']}) {lesson['desc']}\n"
else:
# For Depth section, output subsections in the desired order
for subsection in subsection_order:
if subsection in sections[level]:
toc += subsection_titles.get(subsection, "")
for lesson in sections[level][subsection]:
toc += f"- [{lesson['link_text']}]({lesson['link']}) {lesson['desc']}\n"
toc += "\nContinuously updating..."
return toc
# Define a function to walk through the directory and generate the TOC structure in Chinese
def generate_toc_cn(base_dir, project_root, output_file_dir):
toc = "## 目录\n\n"
section_headers = {
"Basic": "### 入门示例\n\n这一部分包含简单的 eBPF 程序示例和介绍。主要利用 `eunomia-bpf` 框架简化开发,介绍 eBPF 的基本用法和开发流程。\n\n",
"Advance": "### 高级文档和示例\n\n我们开始构建完整的 eBPF 项目,主要基于 `libbpf`,并将其与各种应用场景结合起来,以便实际使用。\n\n",
"Depth": "### 深入主题\n\n这一部分涵盖了与 eBPF 相关的高级主题,包括在 Android 上使用 eBPF 程序、利用 eBPF 程序进行的潜在攻击和防御以及复杂的追踪。结合用户模式和内核模式的 eBPF 可以带来强大的能力(也可能带来安全风险)。\n\n"
}
subsection_titles = {
"Android": "Android:\n\n",
"GPU": "GPU:\n\n",
"Scheduler": "调度器:\n\n",
"Networking": "网络:\n\n",
"tracing": "Tracing:\n\n",
"Security": "安全:\n\n",
"Features": "特性:\n\n",
"Other": "特性:\n\n"
}
subsection_order = ['GPU', 'Scheduler', 'Networking', 'tracing', 'Security', 'Features', 'Other', 'Android']
# To ensure numeric sorting of directories
def sort_key(directory_name):
return list(map(int, re.findall(r'\d+', directory_name)))
sections = {} # {section_level: {subsection_type: [lessons]}}
# Collect all directories including subdirectories
all_dirs = []
for item in os.listdir(base_dir):
item_path = os.path.join(base_dir, item)
if os.path.isdir(item_path):
# Add numbered directories directly
if re.match(r'^\d+', item):
all_dirs.append(item)
# Also add non-numbered directories that have .config file
elif os.path.exists(os.path.join(item_path, ".config")):
all_dirs.append(item)
# Also scan subdirectories (like features/, xpu/)
else:
for subitem in os.listdir(item_path):
subitem_path = os.path.join(item_path, subitem)
if os.path.isdir(subitem_path):
all_dirs.append(os.path.join(item, subitem))
# Sort directories properly by numeric order (non-numeric dirs go to end)
all_dirs = sorted(all_dirs, key=lambda d: sort_key(d) if re.search(r'\d+', d) else [999999])
# Loop over the sorted directories
for directory in all_dirs:
lesson_path = os.path.join(base_dir, directory)
config_path = os.path.join(lesson_path, ".config")
readme_path = os.path.join(lesson_path, "README.zh.md")
if os.path.exists(config_path) and os.path.exists(readme_path):
# Read the .config file for 'level', 'type', and 'desc'
with open(config_path, 'r') as config_file:
config_lines = config_file.readlines()
level = None
lesson_type = None
desc = None
for line in config_lines:
if line.startswith("level="):
level = line.split("=",1)[1].strip()
elif line.startswith("type="):
lesson_type = line.split("=",1)[1].strip()
elif line.startswith("desc="):
desc = line.split("=",1)[1].strip()
# Extract the first markdown title in README.md
with open(readme_path, 'r') as readme_file:
first_title = None
for line in readme_file:
if line.startswith("#"):
first_title = line.strip().lstrip("#").strip()
break
# If title starts with "eBPF", remove the part before the colon
if first_title and first_title.startswith("eBPF"):
if ":" in first_title:
first_title = first_title.split(":", 1)[1].strip()
# Get the relative path for the lesson (relative to the output file's directory)
lesson_rel_path = os.path.relpath(readme_path, output_file_dir)
# Prepare lesson data
# Handle both numbered lessons (e.g., "12-profile") and named lessons (e.g., "features/bpf_arena")
if '-' in os.path.basename(directory):
lesson_number = directory.split('-')[0]
lesson_name = directory.split('-', 1)[1]
link_text = f"lesson {lesson_number}-{lesson_name}"
else:
# For non-numbered directories, use the full path as name
link_text = directory.replace('/', ' ')
link = f"{lesson_rel_path}"
# Use description if available, else use first title
lesson_desc = desc if desc else first_title
lesson_entry = {
'link_text': link_text,
'link': link,
'desc': lesson_desc
}
# Organize lessons into sections and subsections
sections.setdefault(level, {}).setdefault(lesson_type, []).append(lesson_entry)
# Now, output the TOC in the desired order
section_order = ['Basic', 'Advance', 'Depth']
for level in section_order:
if level in sections:
toc += section_headers.get(level, "")
# For Basic and Advance sections, no subsections
if level != 'Depth':
for lesson in sum(sections[level].values(), []): # Flatten the list
toc += f"- [{lesson['link_text']}]({lesson['link']}) {lesson['desc']}\n"
else:
# For Depth section, output subsections in the desired order
for subsection in subsection_order:
if subsection in sections[level]:
toc += subsection_titles.get(subsection, "")
for lesson in sections[level][subsection]:
toc += f"- [{lesson['link_text']}]({lesson['link']}) {lesson['desc']}\n"
toc += "\n持续更新中..."
return toc
def load_template(template_path):
"""Load a template file and return its content"""
with open(template_path, 'r', encoding='utf-8') as f:
return f.read()
def generate_file_from_template(template_path, output_path, toc_content):
"""Generate a file from template by replacing {{TOC_CONTENT}} placeholder"""
template = load_template(template_path)
output_content = template.replace('{{TOC_CONTENT}}', toc_content)
with open(output_path, 'w', encoding='utf-8') as f:
f.write(output_content)
print(f"Generated: {output_path}")
# Main execution
if __name__ == "__main__":
# Get the absolute path to the script's directory
script_dir = os.path.dirname(os.path.abspath(__file__))
# Get the project root (parent of scripts directory)
project_root = os.path.dirname(script_dir)
base_directory = os.path.join(project_root, "src")
scripts_dir = os.path.join(project_root, "scripts")
# Generate TOC content for SUMMARY.md files (output in src/ directory)
toc_summary_en = generate_toc(base_directory, project_root, os.path.join(project_root, 'src'))
toc_summary_cn = generate_toc_cn(base_directory, project_root, os.path.join(project_root, 'src'))
# Generate TOC content for README.md files (output in project root)
toc_readme_en = generate_toc(base_directory, project_root, project_root)
toc_readme_cn = generate_toc_cn(base_directory, project_root, project_root)
# Generate SUMMARY.md from template
generate_file_from_template(
os.path.join(scripts_dir, 'SUMMARY.md.template'),
os.path.join(project_root, 'src', 'SUMMARY.md'),
toc_summary_en
)
# Generate SUMMARY.zh.md from template
generate_file_from_template(
os.path.join(scripts_dir, 'SUMMARY.zh.md.template'),
os.path.join(project_root, 'src', 'SUMMARY.zh.md'),
toc_summary_cn
)
# Generate README.md from template
generate_file_from_template(
os.path.join(scripts_dir, 'README.md.template'),
os.path.join(project_root, 'README.md'),
toc_readme_en
)
# Generate README.zh.md from template
generate_file_from_template(
os.path.join(scripts_dir, 'README.zh.md.template'),
os.path.join(project_root, 'README.zh.md'),
toc_readme_cn
)
print("\nAll files generated successfully!")