<!--
  Fresh export of all 20 diagrams as PNG and full HTML documentation site after the Grand Unification UML sync.
  Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>
  618 lines, 19 KiB, HTML
-->
<!DOCTYPE html>
<!-- The page content is English; declaring it lets assistive technology pick the right voice. -->
<html lang="en">
<head>
  <meta charset="UTF-8">
  <meta name="viewport" content="width=device-width, initial-scale=1">
  <title>UnifiedScraper</title>

  <!-- Web fonts are requested over HTTPS so they are not blocked as mixed content when the site is served securely. -->
  <link rel="stylesheet" href="https://fonts.googleapis.com/css?family=Source+Sans+Pro:300,400,700,300italic,400italic,700italic|Source+Code+Pro:300,400,700">

  <!-- Local stylesheets, in the order of the original export. -->
  <link rel="stylesheet" href="../assets/css/bootstrap.css">
  <link rel="stylesheet" href="../assets/css/jquery.bonsai.css">
  <link rel="stylesheet" href="../assets/css/main.css">
  <link rel="stylesheet" href="../assets/icon-font/icons.css">

  <!--
    Scripts stay synchronous and in their original order: the inline script at the
    end of the body calls imageMapResize() immediately, so imageMapResizer must be
    loaded before the body is parsed.
  -->
  <script src="../assets/js/jquery-2.1.0.min.js"></script>
  <script src="../assets/js/bootstrap.js"></script>
  <script src="../assets/js/jquery.bonsai.js"></script>
  <script src="../assets/js/imageMapResizer.min.js"></script>
</head>
|
|
<body>
|
|
<div>
|
|
|
|
<!-- Element name shown as the page heading -->
<h1>UnifiedScraper</h1>

<!-- Element type badge: metaclass icon followed by the metaclass name -->
<section style="margin-top: .5em;">
  <span class="alert alert-info">
    <span class="node-icon staruml-icon icon-UMLClass"></span>
    UMLClass
  </span>
</section>
|
|
|
|
<!-- Containment path: project :: model :: package :: this class -->
<section style="margin-top: 10px">
  <span class="label label-info"><a href="cf9c8b720f3815adeccaf3ef6e48c6c4.html"><span class="node-icon staruml-icon icon-Project"></span>Skill Seekers</a></span>
  <span>::</span>
  <span class="label label-info"><a href="6a4361334e8b649314ed681b9e6798c3.html"><span class="node-icon staruml-icon icon-UMLModel"></span>skill_seekers</a></span>
  <span>::</span>
  <span class="label label-info"><a href="9a6a2c65f0fecfbf94214fe5dacc11b2.html"><span class="node-icon staruml-icon icon-UMLPackage"></span>Scrapers</a></span>
  <span>::</span>
  <span class="label label-info"><a href="b1cc179750d7478da42c374e551b414d.html"><span class="node-icon staruml-icon icon-UMLClass"></span>UnifiedScraper</a></span>
</section>
|
|
|
|
<!-- Diagram -->
|
|
|
|
|
|
|
|
<!-- Free-text description of the element, as entered in the model -->
<section>
  <h3>Description</h3>
  <div>
    <p>Orchestrates multi-source skill building from a unified config JSON. Dispatches to 17 source-type scrapers, detects conflicts between sources, merges data (rule-based or claude-enhanced), and produces a single combined skill. Source: unified_scraper.py</p>
  </div>
</section>
|
|
|
|
|
|
<!-- Specification -->
|
|
|
|
|
|
|
|
<!-- Directed Relationship -->
|
|
|
|
|
|
|
|
<!-- Undirected Relationship -->
|
|
|
|
|
|
|
|
<!-- Classifier: elements this class generalizes to (its parent) -->
<section class="element-list">
  <h3>Generalized Elements</h3>
  <ul class="nav nav-list">
    <li><a href="a41818884a205b0bf873ee45b258004c.html"><span class="node-icon staruml-icon icon-UMLClass"></span>SkillConverter</a></li>
  </ul>
</section>
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
<!-- Interface -->
|
|
|
|
|
|
|
|
<!-- Component -->
|
|
|
|
|
|
|
|
<!-- Node -->
|
|
|
|
|
|
|
|
<!-- Actor -->
|
|
|
|
|
|
|
|
<!-- Use Case -->
|
|
|
|
|
|
|
|
<!-- Template Parameters -->
|
|
|
|
|
|
|
|
<!-- Literals -->
|
|
|
|
|
|
|
|
<!-- Attributes: one row per attribute; the name links to the attribute's own page -->
<section>
  <h3>Attributes</h3>
  <table class="table table-striped table-bordered">
    <!-- Header cells live in thead and carry scope="col" so screen readers can associate each data cell with its column. -->
    <thead>
      <tr>
        <th scope="col">Visibility</th>
        <th scope="col">Name</th>
        <th scope="col">Type</th>
        <th scope="col">Description</th>
      </tr>
    </thead>
    <tbody>
      <tr>
        <td>private</td>
        <td><a href="2b54f4b5c843614daa3b8b3ba8b4193e.html">config_path</a></td>
        <td>str </td>
        <td></td>
      </tr>
      <tr>
        <td>private</td>
        <td><a href="f4db861e5abb6fe26e3a5557cc57811a.html">config</a></td>
        <td>dict </td>
        <td></td>
      </tr>
      <tr>
        <td>private</td>
        <td><a href="2e25208e715d59436de44b27a44ac697.html">merge_mode</a></td>
        <td>str </td>
        <td></td>
      </tr>
      <tr>
        <td>private</td>
        <td><a href="5f0fc8c9a8d68e2d81f1ae09f555f3c2.html">scraped_data</a></td>
        <td>dict </td>
        <td></td>
      </tr>
      <tr>
        <td>private</td>
        <td><a href="f1dffaabd9e26930bf0ec66d2746e373.html">name</a></td>
        <td>str </td>
        <td></td>
      </tr>
      <tr>
        <td>private</td>
        <td><a href="253f8b544aea98e0c2ec579722ea8bd6.html">output_dir</a></td>
        <td>str </td>
        <td></td>
      </tr>
    </tbody>
  </table>
</section>
|
|
|
|
|
|
<!-- Operations: one row per operation; the name links to the operation's own page -->
<section>
  <h3>Operations</h3>
  <table class="table table-striped table-bordered">
    <!-- Header cells live in thead and carry scope="col" so screen readers can associate each data cell with its column. -->
    <thead>
      <tr>
        <th scope="col">Visibility</th>
        <th scope="col">Name</th>
        <th scope="col">Description</th>
      </tr>
    </thead>
    <tbody>
      <!--
        NOTE(review): scrape_all_sources() and merge_sources() each appear twice below,
        linking to different element pages. This looks like duplicate operations in the
        source model; confirm and remove the duplicates there, then re-export, rather
        than editing this generated page.
      -->
      <tr>
        <td>public</td>
        <td><a href="14ed62b4bedb9fd3fecedd2603cd2749.html">scrape_all_sources()</a></td>
        <td></td>
      </tr>
      <tr>
        <td>public</td>
        <td><a href="53c2f510b0b84df0598d832ceee2ae2e.html">merge_sources()</a></td>
        <td></td>
      </tr>
      <tr>
        <td>public</td>
        <td><a href="c1ede8d083a70c77c766dd303ac629e1.html">scrape_all_sources()</a></td>
        <td></td>
      </tr>
      <tr>
        <td>public</td>
        <td><a href="6fcb0bd02ed0c787a074ac9345cde8f0.html">detect_conflicts()</a></td>
        <td></td>
      </tr>
      <tr>
        <td>public</td>
        <td><a href="fad2645b8ec341002a3f764ccbb6dd7b.html">merge_sources()</a></td>
        <td></td>
      </tr>
      <tr>
        <td>public</td>
        <td><a href="42a937886ad1e7416759df5800be9246.html">build_skill()</a></td>
        <td></td>
      </tr>
      <tr>
        <td>public</td>
        <td><a href="405e3ec539575c992453f2c096d860b8.html">run()</a></td>
        <td></td>
      </tr>
    </tbody>
  </table>
</section>
|
|
|
|
|
|
<!-- Receptions -->
|
|
|
|
|
|
|
|
<!-- Extension Points -->
|
|
|
|
|
|
|
|
<!-- Parameters -->
|
|
|
|
|
|
|
|
<!-- Diagrams -->
|
|
|
|
|
|
|
|
|
|
<!-- Behavior -->
|
|
|
|
|
|
|
|
<!-- Action -->
|
|
|
|
|
|
|
|
<!-- Interaction -->
|
|
|
|
|
|
|
|
<!-- CombinedFragment -->
|
|
|
|
|
|
|
|
<!-- Activity -->
|
|
|
|
|
|
|
|
<!-- State Machine -->
|
|
|
|
|
|
|
|
<!-- State Machine -->
|
|
|
|
|
|
|
|
<!-- State -->
|
|
|
|
|
|
|
|
<!-- Vertex -->
|
|
|
|
|
|
|
|
<!-- Transition -->
|
|
|
|
|
|
|
|
<!-- Data Model (ERD) -->
|
|
|
|
|
|
|
|
<!-- Columns (ERD) -->
|
|
|
|
|
|
|
|
<!-- Related Entities (ERD) -->
|
|
|
|
|
|
|
|
<!-- Data Flows (DFD) -->
|
|
|
|
|
|
|
|
<!-- Flows (Flowchart) -->
|
|
|
|
|
|
|
|
<!-- Properties: raw name/value pairs of the model element -->
<section>
  <h3>Properties</h3>
  <table class="table table-striped table-bordered">
    <!--
      Column widths are set with CSS instead of the obsolete width attribute on th.
      Header cells live in thead and carry scope="col" for assistive technology.
    -->
    <thead>
      <tr>
        <th scope="col" style="width: 50%">Name</th>
        <th scope="col" style="width: 50%">Value</th>
      </tr>
    </thead>
    <tbody>
      <tr>
        <td>name</td>
        <td>UnifiedScraper</td>
      </tr>
      <tr>
        <td>stereotype</td>
        <td><span class="label label-info">null</span></td>
      </tr>
      <tr>
        <td>visibility</td>
        <td>public</td>
      </tr>
      <tr>
        <td>isAbstract</td>
        <td><span class="label label-info">false</span></td>
      </tr>
      <tr>
        <td>isFinalSpecialization</td>
        <td><span class="label label-info">false</span></td>
      </tr>
      <tr>
        <td>isLeaf</td>
        <td><span class="label label-info">false</span></td>
      </tr>
      <tr>
        <td>isActive</td>
        <td><span class="label label-info">false</span></td>
      </tr>
    </tbody>
  </table>
</section>
|
|
|
|
<!-- Tags -->
|
|
|
|
|
|
|
|
<!-- Dependencies: classes this element depends on (no constraints or dependants are listed) -->
<section class="element-list">
  <h3>Dependencies</h3>
  <ul class="nav nav-list">
    <li><a href="3af5ea4716a6bdcdb5593eb62d9fe016.html"><span class="node-icon staruml-icon icon-UMLClass"></span>DocToSkillConverter</a></li>
    <li><a href="f821b72afc0c59329dd76d9eb0aa9780.html"><span class="node-icon staruml-icon icon-UMLClass"></span>GitHubScraper</a></li>
    <li><a href="19fafbea28e5d5f773d66b64b077ad83.html"><span class="node-icon staruml-icon icon-UMLClass"></span>GitHubToSkillConverter</a></li>
    <li><a href="f404e5b8c71d89b9a74f9b872351ff0d.html"><span class="node-icon staruml-icon icon-UMLClass"></span>PDFToSkillConverter</a></li>
    <li><a href="02231b18c56eee1fe00db0b3cc88d3f3.html"><span class="node-icon staruml-icon icon-UMLClass"></span>WordToSkillConverter</a></li>
    <li><a href="d17d20c49ea8b49688427e3f2da2a5de.html"><span class="node-icon staruml-icon icon-UMLClass"></span>VideoToSkillConverter</a></li>
    <li><a href="50c94d49c4f3c594d8dd4cb8c67e2b7c.html"><span class="node-icon staruml-icon icon-UMLClass"></span>EpubToSkillConverter</a></li>
    <li><a href="1da40a6efac2b652728d1d5516dbc700.html"><span class="node-icon staruml-icon icon-UMLClass"></span>JupyterToSkillConverter</a></li>
    <li><a href="975393f28febd506c6f9a4bdd7d02929.html"><span class="node-icon staruml-icon icon-UMLClass"></span>HtmlToSkillConverter</a></li>
    <li><a href="5c7b162d10d20fa81377595dee3cb625.html"><span class="node-icon staruml-icon icon-UMLClass"></span>OpenAPIToSkillConverter</a></li>
    <li><a href="e8fa4d95e76893b117bcc6f54753011c.html"><span class="node-icon staruml-icon icon-UMLClass"></span>AsciiDocToSkillConverter</a></li>
    <li><a href="d151f121325ce00a55de3cfa14df0780.html"><span class="node-icon staruml-icon icon-UMLClass"></span>PptxToSkillConverter</a></li>
    <li><a href="78badaff41241c07ff29c19231333ae4.html"><span class="node-icon staruml-icon icon-UMLClass"></span>RssToSkillConverter</a></li>
    <li><a href="606976142b92c30df8a10a398571f41c.html"><span class="node-icon staruml-icon icon-UMLClass"></span>ManPageToSkillConverter</a></li>
    <li><a href="7a7a8d9d20d00f70db88f89eefdee448.html"><span class="node-icon staruml-icon icon-UMLClass"></span>ConfluenceToSkillConverter</a></li>
    <li><a href="a4606a82fa614707056585bc7b11c66b.html"><span class="node-icon staruml-icon icon-UMLClass"></span>NotionToSkillConverter</a></li>
    <li><a href="be653f12dac76fd779cd14c40bc893b1.html"><span class="node-icon staruml-icon icon-UMLClass"></span>ChatToSkillConverter</a></li>
  </ul>
</section>
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
<!-- Relationships: every dependency and generalization that starts at this class -->
<section class="element-list">
  <h3>Relationships</h3>
  <ul class="nav nav-list">
    <li><a href="138fdc81880d347a9f7353f299ae298b.html"><span class="node-icon staruml-icon icon-UMLDependency"></span>«subprocess» (UnifiedScraper→DocToSkillConverter)</a></li>
    <li><a href="953c03c8f244268e76b315cd784ce857.html"><span class="node-icon staruml-icon icon-UMLDependency"></span>«import» (UnifiedScraper→GitHubScraper)</a></li>
    <li><a href="1f6fa1dbd7ebaf633e35b49b9555bd33.html"><span class="node-icon staruml-icon icon-UMLDependency"></span>«import» (UnifiedScraper→GitHubToSkillConverter)</a></li>
    <li><a href="324032f1575138205edf628e46d0039a.html"><span class="node-icon staruml-icon icon-UMLDependency"></span>«import» (UnifiedScraper→PDFToSkillConverter)</a></li>
    <li><a href="3359340e9f06e544c06382103b6667df.html"><span class="node-icon staruml-icon icon-UMLDependency"></span>«import» (UnifiedScraper→WordToSkillConverter)</a></li>
    <li><a href="d95939a853affe6c79ab0c3fd7d3a6eb.html"><span class="node-icon staruml-icon icon-UMLDependency"></span>«import» (UnifiedScraper→VideoToSkillConverter)</a></li>
    <li><a href="68349bca69c1c7b57895f50233175342.html"><span class="node-icon staruml-icon icon-UMLDependency"></span>«import» (UnifiedScraper→EpubToSkillConverter)</a></li>
    <li><a href="6bdfa7111970adf2c8322b42516202db.html"><span class="node-icon staruml-icon icon-UMLDependency"></span>«import» (UnifiedScraper→JupyterToSkillConverter)</a></li>
    <li><a href="0af0718934b7c9bf0704b33c6edceb0a.html"><span class="node-icon staruml-icon icon-UMLDependency"></span>«import» (UnifiedScraper→HtmlToSkillConverter)</a></li>
    <li><a href="63bdd9a1ed32573d420b74add866fc74.html"><span class="node-icon staruml-icon icon-UMLDependency"></span>«import» (UnifiedScraper→OpenAPIToSkillConverter)</a></li>
    <li><a href="d334f298a53420077a037f8e03761d51.html"><span class="node-icon staruml-icon icon-UMLDependency"></span>«import» (UnifiedScraper→AsciiDocToSkillConverter)</a></li>
    <li><a href="f9655092d3df6e9efdb98c0e59e25ab3.html"><span class="node-icon staruml-icon icon-UMLDependency"></span>«import» (UnifiedScraper→PptxToSkillConverter)</a></li>
    <li><a href="d473e1f5dca164ccf643cfc2437c6eb4.html"><span class="node-icon staruml-icon icon-UMLDependency"></span>«import» (UnifiedScraper→RssToSkillConverter)</a></li>
    <li><a href="61efc38c4515bced685b1a983308aa41.html"><span class="node-icon staruml-icon icon-UMLDependency"></span>«import» (UnifiedScraper→ManPageToSkillConverter)</a></li>
    <li><a href="ce9f1d2d8b56223ff3ed921ce087eed4.html"><span class="node-icon staruml-icon icon-UMLDependency"></span>«import» (UnifiedScraper→ConfluenceToSkillConverter)</a></li>
    <li><a href="6a25496164773bffdf9c3bc30c9b50bc.html"><span class="node-icon staruml-icon icon-UMLDependency"></span>«import» (UnifiedScraper→NotionToSkillConverter)</a></li>
    <li><a href="690011eb8eb436df4bc3e93dc95d063a.html"><span class="node-icon staruml-icon icon-UMLDependency"></span>«import» (UnifiedScraper→ChatToSkillConverter)</a></li>
    <li><a href="aa6ab8441c635ce955bc904b6cc64d4f.html"><span class="node-icon staruml-icon icon-UMLGeneralization"></span>(UnifiedScraper→SkillConverter)</a></li>
  </ul>
</section>
|
|
|
|
|
|
|
|
<!-- Owned Elements: model elements contained by this class (here, its outgoing relationships) -->
<section class="element-list">
  <h3>Owned Elements</h3>
  <ul class="nav nav-list">
    <li><a href="138fdc81880d347a9f7353f299ae298b.html"><span class="node-icon staruml-icon icon-UMLDependency"></span>«subprocess» (UnifiedScraper→DocToSkillConverter)</a></li>
    <li><a href="953c03c8f244268e76b315cd784ce857.html"><span class="node-icon staruml-icon icon-UMLDependency"></span>«import» (UnifiedScraper→GitHubScraper)</a></li>
    <li><a href="1f6fa1dbd7ebaf633e35b49b9555bd33.html"><span class="node-icon staruml-icon icon-UMLDependency"></span>«import» (UnifiedScraper→GitHubToSkillConverter)</a></li>
    <li><a href="324032f1575138205edf628e46d0039a.html"><span class="node-icon staruml-icon icon-UMLDependency"></span>«import» (UnifiedScraper→PDFToSkillConverter)</a></li>
    <li><a href="3359340e9f06e544c06382103b6667df.html"><span class="node-icon staruml-icon icon-UMLDependency"></span>«import» (UnifiedScraper→WordToSkillConverter)</a></li>
    <li><a href="d95939a853affe6c79ab0c3fd7d3a6eb.html"><span class="node-icon staruml-icon icon-UMLDependency"></span>«import» (UnifiedScraper→VideoToSkillConverter)</a></li>
    <li><a href="68349bca69c1c7b57895f50233175342.html"><span class="node-icon staruml-icon icon-UMLDependency"></span>«import» (UnifiedScraper→EpubToSkillConverter)</a></li>
    <li><a href="6bdfa7111970adf2c8322b42516202db.html"><span class="node-icon staruml-icon icon-UMLDependency"></span>«import» (UnifiedScraper→JupyterToSkillConverter)</a></li>
    <li><a href="0af0718934b7c9bf0704b33c6edceb0a.html"><span class="node-icon staruml-icon icon-UMLDependency"></span>«import» (UnifiedScraper→HtmlToSkillConverter)</a></li>
    <li><a href="63bdd9a1ed32573d420b74add866fc74.html"><span class="node-icon staruml-icon icon-UMLDependency"></span>«import» (UnifiedScraper→OpenAPIToSkillConverter)</a></li>
    <li><a href="d334f298a53420077a037f8e03761d51.html"><span class="node-icon staruml-icon icon-UMLDependency"></span>«import» (UnifiedScraper→AsciiDocToSkillConverter)</a></li>
    <li><a href="f9655092d3df6e9efdb98c0e59e25ab3.html"><span class="node-icon staruml-icon icon-UMLDependency"></span>«import» (UnifiedScraper→PptxToSkillConverter)</a></li>
    <li><a href="d473e1f5dca164ccf643cfc2437c6eb4.html"><span class="node-icon staruml-icon icon-UMLDependency"></span>«import» (UnifiedScraper→RssToSkillConverter)</a></li>
    <li><a href="61efc38c4515bced685b1a983308aa41.html"><span class="node-icon staruml-icon icon-UMLDependency"></span>«import» (UnifiedScraper→ManPageToSkillConverter)</a></li>
    <li><a href="ce9f1d2d8b56223ff3ed921ce087eed4.html"><span class="node-icon staruml-icon icon-UMLDependency"></span>«import» (UnifiedScraper→ConfluenceToSkillConverter)</a></li>
    <li><a href="6a25496164773bffdf9c3bc30c9b50bc.html"><span class="node-icon staruml-icon icon-UMLDependency"></span>«import» (UnifiedScraper→NotionToSkillConverter)</a></li>
    <li><a href="690011eb8eb436df4bc3e93dc95d063a.html"><span class="node-icon staruml-icon icon-UMLDependency"></span>«import» (UnifiedScraper→ChatToSkillConverter)</a></li>
    <li><a href="aa6ab8441c635ce955bc904b6cc64d4f.html"><span class="node-icon staruml-icon icon-UMLGeneralization"></span>(UnifiedScraper→SkillConverter)</a></li>
  </ul>
</section>
|
|
|
|
|
|
|
|
<!-- Diagrams: diagrams on which this class appears -->
<section class="element-list">
  <h3>Diagrams</h3>
  <ul class="nav nav-list">
    <li><a href="a47184837219aea9ccabc89e35d90216.html"><span class="node-icon staruml-icon icon-UMLClassDiagram"></span>Scrapers</a></li>
  </ul>
</section>
|
|
|
|
|
|
|
|
|
|
<!-- Image Map Resizer (https://github.com/davidjbradshaw/image-map-resizer) -->
<script>
  // Runs as soon as this point of the document is parsed; relies on
  // imageMapResizer.min.js having been loaded from the document head.
  imageMapResize();
</script>
|
|
</div>
|
|
</body>
|
|
</html>
|