yusufkaraaslan
diff --git a/AGENTS.md b/AGENTS.md
Lines changed: 24 additions & 50 deletions
diff --git a/pyproject.toml b/pyproject.toml
Lines changed: 9 additions & 0 deletions
diff --git a/src/skill_seekers/cli/arguments/__init__.py b/src/skill_seekers/cli/arguments/__init__.py
Lines changed: 3 additions & 0 deletions
diff --git a/src/skill_seekers/cli/arguments/create.py b/src/skill_seekers/cli/arguments/create.py
Lines changed: 19 additions & 1 deletion
diff --git a/src/skill_seekers/cli/arguments/word.py b/src/skill_seekers/cli/arguments/word.py
Lines changed: 66 additions & 0 deletions
@@ -12,10 +12,12 @@ This file provides essential guidance for AI coding agents working with the Skil
 
 | Attribute | Value |
 |-----------|-------|
-| **Current Version** | 3.0.0 |
+| **Current Version** | 3.1.3 |
 | **Python Version** | 3.10+ (tested on 3.10, 3.11, 3.12, 3.13) |
 | **License** | MIT |
 | **Package Name** | `skill-seekers` (PyPI) |
+| **Source Files** | 169 Python files |
+| **Test Files** | 101 test files |
 | **Website** | https://skillseekersweb.com/ |
 | **Repository** | https://github.com/yusufkaraaslan/Skill_Seekers |
 
@@ -55,7 +57,7 @@ This file provides essential guidance for AI coding agents working with the Skil
 ```
 /mnt/1ece809a-2821-4f10-aecb-fcdf34760c0b/Git/Skill_Seekers/
 ├── src/skill_seekers/              # Main source code (src/ layout)
-│   ├── cli/                        # CLI tools and commands (~42k lines)
+│   ├── cli/                        # CLI tools and commands (~70 modules)
 │   │   ├── adaptors/               # Platform adaptors (Strategy pattern)
 │   │   │   ├── base.py             # Abstract base class (SkillAdaptor)
 │   │   │   ├── claude.py           # Claude AI adaptor
@@ -70,12 +72,6 @@ This file provides essential guidance for AI coding agents working with the Skil
 │   │   │   ├── qdrant.py           # Qdrant vector DB adaptor
 │   │   │   ├── weaviate.py         # Weaviate vector DB adaptor
 │   │   │   └── streaming_adaptor.py # Streaming output adaptor
-│   │   ├── storage/                # Cloud storage backends
-│   │   │   ├── base_storage.py     # Storage interface
-│   │   │   ├── s3_storage.py       # AWS S3 support
-│   │   │   ├── gcs_storage.py      # Google Cloud Storage
-│   │   │   └── azure_storage.py    # Azure Blob Storage
-│   │   ├── parsers/                # CLI argument parsers
 │   │   ├── arguments/              # CLI argument definitions
 │   │   ├── presets/                # Preset configuration management
 │   │   ├── main.py                 # Unified CLI entry point
@@ -85,6 +81,7 @@ This file provides essential guidance for AI coding agents working with the Skil
 │   │   ├── pdf_scraper.py          # PDF extraction
 │   │   ├── unified_scraper.py      # Multi-source scraping
 │   │   ├── codebase_scraper.py     # Local codebase analysis
+│   │   ├── enhance_command.py      # AI enhancement command
 │   │   ├── enhance_skill_local.py  # AI enhancement (local mode)
 │   │   ├── package_skill.py        # Skill packager
 │   │   ├── upload_skill.py         # Upload to platforms
@@ -101,8 +98,8 @@ This file provides essential guidance for AI coding agents working with the Skil
 │   │   ├── source_manager.py       # Config source management
 │   │   └── tools/                  # MCP tool implementations
 │   │       ├── config_tools.py     # Configuration tools
-│   │       ├── scraping_tools.py   # Scraping tools
 │   │       ├── packaging_tools.py  # Packaging tools
+│   │       ├── scraping_tools.py   # Scraping tools
 │   │       ├── source_tools.py     # Source management tools
 │   │       ├── splitting_tools.py  # Config splitting tools
 │   │       ├── vector_db_tools.py  # Vector database tools
@@ -124,7 +121,7 @@ This file provides essential guidance for AI coding agents working with the Skil
 │   ├── workflows/                  # YAML workflow presets
 │   ├── _version.py                 # Version information (reads from pyproject.toml)
 │   └── __init__.py                 # Package init
-├── tests/                          # Test suite (98 test files)
+├── tests/                          # Test suite (101 test files)
 ├── configs/                        # Preset configuration files
 ├── docs/                           # Documentation (80+ markdown files)
 │   ├── integrations/               # Platform integration guides
@@ -134,17 +131,6 @@ This file provides essential guidance for AI coding agents working with the Skil
 │   ├── blog/                       # Blog posts
 │   └── roadmap/                    # Roadmap documents
 ├── examples/                       # Usage examples
-│   ├── langchain-rag-pipeline/     # LangChain example
-│   ├── llama-index-query-engine/   # LlamaIndex example
-│   ├── pinecone-upsert/            # Pinecone example
-│   ├── chroma-example/             # Chroma example
-│   ├── weaviate-example/           # Weaviate example
-│   ├── qdrant-example/             # Qdrant example
-│   ├── faiss-example/              # FAISS example
-│   ├── haystack-pipeline/          # Haystack example
-│   ├── cursor-react-skill/         # Cursor IDE example
-│   ├── windsurf-fastapi-context/   # Windsurf example
-│   └── continue-dev-universal/     # Continue.dev example
 ├── .github/workflows/              # CI/CD workflows
 ├── pyproject.toml                  # Main project configuration
 ├── requirements.txt                # Pinned dependencies
@@ -259,7 +245,7 @@ pytest tests/ -v -m "not slow and not integration"
 
 ### Test Architecture
 
-- **98 test files** covering all features
+- **101 test files** covering all features
 - **1880+ tests** passing
 - CI Matrix: Ubuntu + macOS, Python 3.10-3.12
 - Test markers defined in `pyproject.toml`:
@@ -316,22 +302,19 @@ mypy src/skill_seekers --show-error-codes --pretty
 - **Ignored rules:** E501, F541, ARG002, B007, I001, SIM114
 - **Import sorting:** isort style with `skill_seekers` as first-party
 
-### MyPy Configuration (from mypy.ini)
-
-```ini
-[mypy]
-python_version = 3.10
-warn_return_any = False
-warn_unused_configs = True
-disallow_untyped_defs = False
-check_untyped_defs = True
-ignore_missing_imports = True
-no_implicit_optional = True
-show_error_codes = True
-
-# Gradual typing - be lenient for now
-disallow_incomplete_defs = False
-disallow_untyped_calls = False
+### MyPy Configuration (from pyproject.toml)
+
+```toml
+[tool.mypy]
+python_version = "3.10"
+warn_return_any = true
+warn_unused_configs = true
+disallow_untyped_defs = false
+disallow_incomplete_defs = false
+check_untyped_defs = true
+ignore_missing_imports = true
+show_error_codes = true
+pretty = true
 ```
 
 ### Code Conventions
@@ -662,17 +645,6 @@ Preset configs are in `configs/` directory:
 - `astrovalley_unified.json` - Astrovalley
 - `configs/integrations/` - Integration-specific configs
 
-### Configuration Documentation
-
-Preset configs are in `configs/` directory:
-- `godot.json` - Godot Engine
-- `blender.json` / `blender-unified.json` - Blender Engine
-- `claude-code.json` - Claude Code
-- `httpx_comprehensive.json` - HTTPX library
-- `medusa-mercurjs.json` - Medusa/MercurJS
-- `astrovalley_unified.json` - Astrovalley
-- `configs/integrations/` - Integration-specific configs
-
 ---
 
 ## Key Dependencies
@@ -700,6 +672,8 @@ Preset configs are in `configs/` directory:
 | `python-dotenv` | >=1.1.1 | Environment variables |
 | `jsonschema` | >=4.25.1 | JSON validation |
 | `PyYAML` | >=6.0 | YAML parsing |
+| `langchain` | >=1.2.10 | LangChain integration |
+| `llama-index` | >=0.14.15 | LlamaIndex integration |
 
 ### Optional Dependencies
 
@@ -852,4 +826,4 @@ Skill Seekers uses JSON configuration files to define scraping targets. Example
 
 *This document is maintained for AI coding agents. For human contributors, see README.md and CONTRIBUTING.md.*
 
-*Last updated: 2026-02-16*
+*Last updated: 2026-02-24*
@@ -109,6 +109,12 @@ azure = [
     "azure-storage-blob>=12.19.0",
 ]
 
+# Word document (.docx) support
+docx = [
+    "mammoth>=1.6.0",
+    "python-docx>=1.1.0",
+]
+
 # RAG vector database upload support
 chroma = [
     "chromadb>=0.4.0",
@@ -146,6 +152,8 @@ embedding = [
 
 # All optional dependencies combined (dev dependencies now in [dependency-groups])
 all = [
+    "mammoth>=1.6.0",
+    "python-docx>=1.1.0",
     "mcp>=1.25,<2",
     "httpx>=0.28.1",
     "httpx-sse>=0.4.3",
@@ -186,6 +194,7 @@ skill-seekers-resume = "skill_seekers.cli.resume_command:main"
 skill-seekers-scrape = "skill_seekers.cli.doc_scraper:main"
 skill-seekers-github = "skill_seekers.cli.github_scraper:main"
 skill-seekers-pdf = "skill_seekers.cli.pdf_scraper:main"
+skill-seekers-word = "skill_seekers.cli.word_scraper:main"
 skill-seekers-unified = "skill_seekers.cli.unified_scraper:main"
 skill-seekers-enhance = "skill_seekers.cli.enhance_command:main"
 skill-seekers-enhance-status = "skill_seekers.cli.enhance_status:main"
 
@@ -21,6 +21,7 @@
 from .scrape import add_scrape_arguments, SCRAPE_ARGUMENTS
 from .github import add_github_arguments, GITHUB_ARGUMENTS
 from .pdf import add_pdf_arguments, PDF_ARGUMENTS
+from .word import add_word_arguments, WORD_ARGUMENTS
 from .analyze import add_analyze_arguments, ANALYZE_ARGUMENTS
 from .unified import add_unified_arguments, UNIFIED_ARGUMENTS
 from .package import add_package_arguments, PACKAGE_ARGUMENTS
@@ -38,11 +39,13 @@
     "add_package_arguments",
     "add_upload_arguments",
     "add_enhance_arguments",
+    "add_word_arguments",
     # Data
     "COMMON_ARGUMENTS",
     "SCRAPE_ARGUMENTS",
     "GITHUB_ARGUMENTS",
     "PDF_ARGUMENTS",
+    "WORD_ARGUMENTS",
     "ANALYZE_ARGUMENTS",
     "UNIFIED_ARGUMENTS",
     "PACKAGE_ARGUMENTS",
 
@@ -389,6 +389,18 @@
     },
 }
 
+# Word document specific (mirrors --docx from arguments/word.py; --from-json is not exposed here)
+WORD_ARGUMENTS: dict[str, dict[str, Any]] = {
+    "docx": {
+        "flags": ("--docx",),
+        "kwargs": {
+            "type": str,
+            "help": "DOCX file path",
+            "metavar": "PATH",
+        },
+    },
+}
+
 # Multi-source config specific (from unified_scraper.py)
 CONFIG_ARGUMENTS: dict[str, dict[str, Any]] = {
     "merge_mode": {
@@ -471,6 +483,7 @@ def get_source_specific_arguments(source_type: str) -> dict[str, dict[str, Any]]
         "github": GITHUB_ARGUMENTS,
         "local": LOCAL_ARGUMENTS,
         "pdf": PDF_ARGUMENTS,
+        "word": WORD_ARGUMENTS,
         "config": CONFIG_ARGUMENTS,
     }
     return source_args.get(source_type, {})
@@ -507,12 +520,13 @@ def add_create_arguments(parser: argparse.ArgumentParser, mode: str = "default")
     - 'github': Universal + github-specific
     - 'local': Universal + local-specific
     - 'pdf': Universal + pdf-specific
+    - 'word': Universal + word-specific
     - 'advanced': Advanced/rare arguments
     - 'all': All 120+ arguments
 
     Args:
         parser: ArgumentParser to add arguments to
-        mode: Help mode (default, web, github, local, pdf, advanced, all)
+        mode: Help mode (default, web, github, local, pdf, word, advanced, all)
     """
     # Positional argument for source
     parser.add_argument(
@@ -543,6 +557,10 @@ def add_create_arguments(parser: argparse.ArgumentParser, mode: str = "default")
         for arg_name, arg_def in PDF_ARGUMENTS.items():
             parser.add_argument(*arg_def["flags"], **arg_def["kwargs"])
 
+    if mode in ["word", "all"]:
+        for arg_name, arg_def in WORD_ARGUMENTS.items():
+            parser.add_argument(*arg_def["flags"], **arg_def["kwargs"])
+
     if mode in ["config", "all"]:
         for arg_name, arg_def in CONFIG_ARGUMENTS.items():
             parser.add_argument(*arg_def["flags"], **arg_def["kwargs"])
 
@@ -0,0 +1,66 @@
+"""Word document command argument definitions.
+
+This module defines ALL arguments for the word command in ONE place.
+Both word_scraper.py (standalone) and parsers/word_parser.py (unified CLI)
+import and use these definitions.
+
+Shared arguments (name, description, output, enhance-level, api-key,
+dry-run, verbose, quiet, workflow args) come from common.py / workflow.py
+via ``add_all_standard_arguments()``.
+"""
+
+import argparse
+from typing import Any
+
+from .common import add_all_standard_arguments
+
+# Word-specific arguments as data: name -> {"flags": option strings, "kwargs": parser.add_argument() keywords}
+# NOTE: Shared args (name, description, output, enhance_level, api_key, dry_run,
+#       verbose, quiet, workflow args) are registered by add_all_standard_arguments().
+WORD_ARGUMENTS: dict[str, dict[str, Any]] = {
+    "docx": {
+        "flags": ("--docx",),
+        "kwargs": {
+            "type": str,
+            "help": "Direct DOCX file path",
+            "metavar": "PATH",
+        },
+    },
+    "from_json": {
+        "flags": ("--from-json",),
+        "kwargs": {
+            "type": str,
+            "help": "Build skill from extracted JSON",
+            "metavar": "FILE",
+        },
+    },
+}
+
+
+def add_word_arguments(parser: argparse.ArgumentParser) -> None:
+    """Add all word command arguments to a parser.
+
+    Registers shared args (name, description, output, enhance-level, api-key,
+    dry-run, verbose, quiet, workflow args) via add_all_standard_arguments(),
+    then adds Word-specific args on top.
+
+    The default for --enhance-level is overridden to 0 (disabled) for Word.
+    """
+    # Register the shared/universal args first so the enhance-level action exists to be patched below
+    add_all_standard_arguments(parser)
+
+    # Override enhance-level default to 0 for Word by patching the registered action (reads argparse's private parser._actions)
+    for action in parser._actions:
+        if hasattr(action, "dest") and action.dest == "enhance_level":
+            action.default = 0
+            action.help = (
+                "AI enhancement level (auto-detects API vs LOCAL mode): "
+                "0=disabled (default for Word), 1=SKILL.md only, 2=+architecture/config, 3=full enhancement. "
+                "Mode selection: uses API if ANTHROPIC_API_KEY is set, otherwise LOCAL (Claude Code)"
+            )
+
+    # Word-specific args: each WORD_ARGUMENTS entry becomes one parser.add_argument() call
+    for arg_name, arg_def in WORD_ARGUMENTS.items():
+        flags = arg_def["flags"]
+        kwargs = arg_def["kwargs"]
+        parser.add_argument(*flags, **kwargs)