Skip to content

Commit d012efb

Browse files
final
1 parent d6c901a commit d012efb

File tree

3 files changed

+23
-276
lines changed

3 files changed

+23
-276
lines changed

demo.py

Lines changed: 0 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -1,4 +1,3 @@
1-
# Crayon v5.1.0 Demo
21

32
from crayon import CrayonVocab
43

pyproject.toml

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -4,10 +4,10 @@ build-backend = "setuptools.build_meta"
44

55
[project]
66
name = "xerv-crayon"
7-
version = "5.2.0"
7+
version = "5.2.4"
88
description = "Omni-Backend Tokenizer - CPU (AVX2/512), CUDA (NVIDIA), ROCm (AMD) with automatic hardware detection"
99
readme = "README.md"
10-
requires-python = ">=3.8"
10+
requires-python = ">=3.8,<3.13"
1111
license = {file = "LICENSE"}
1212
authors = [
1313
{name = "Xerv Research Engineering Division", email = "engineering@xerv.ai"}

setup.py

Lines changed: 21 additions & 273 deletions
Original file line number | Diff line number | Diff line change
@@ -1,311 +1,59 @@
11
"""
2-
XERV CRAYON SETUP v5.2.0 - Production Omni-Backend Build System
3-
================================================================
4-
GUARANTEED CUDA SUPPORT - PyTorch 2.10+ Compatible
2+
XERV CRAYON SETUP v5.2.3 - PRODUCTION BUILD
3+
============================================
4+
With CPU extensions for guaranteed performance
55
"""
66

77
import os
88
import sys
9-
import subprocess
10-
import shutil
119
from setuptools import setup, Extension, find_packages
12-
from setuptools.command.build_ext import build_ext
13-
from distutils.sysconfig import get_python_inc
1410

15-
VERSION = "5.2.0"
11+
VERSION = "5.2.4"
1612

17-
def log(msg: str, level: str = "INFO") -> None:
13+
def log(msg: str) -> None:
1814
print(f"[CRAYON-BUILD] {msg}", flush=True)
1915

20-
# ============================================================================
21-
# CUDA DETECTION AND COMPILATION - GUARANTEED TO WORK
22-
# ============================================================================
23-
24-
FORCE_CPU = os.environ.get("CRAYON_FORCE_CPU", "0") == "1"
25-
FORCE_CUDA = os.environ.get("CRAYON_FORCE_CUDA", "0") == "1"
26-
os.environ["MAX_JOBS"] = os.environ.get("MAX_JOBS", "1")
27-
28-
# Detect PyTorch & CUDA - ROBUST DETECTION
29-
try:
30-
import torch
31-
log(f"PyTorch v{torch.__version__} detected")
32-
33-
# Initialize CUDA variables
34-
CUDAExtension = None
35-
BuildExtension = None
36-
CUDA_HOME = None
37-
TORCH_CUDA_AVAILABLE = False
38-
39-
# Check PyTorch CUDA availability first
40-
if torch.cuda.is_available():
41-
log(" PyTorch CUDA is available")
42-
TORCH_CUDA_AVAILABLE = True
43-
44-
# Try all possible import methods for PyTorch 2.10+
45-
import_methods = [
46-
# Method 1: Old path (PyTorch < 2.10)
47-
lambda: __import__('torch.utils.cpp_extension', fromlist=['CUDAExtension', 'BuildExtension', 'CUDA_HOME']),
48-
# Method 2: New path (PyTorch 2.10+)
49-
lambda: __import__('torch.cuda.cpp_extension', fromlist=['CUDAExtension', 'BuildExtension', 'CUDA_HOME']),
50-
# Method 3: Direct import via torch.cuda
51-
lambda: __import__('torch.cuda.cpp_extension'),
52-
]
53-
54-
for i, method in enumerate(import_methods, 1):
55-
try:
56-
module = method()
57-
CUDAExtension = getattr(module, 'CUDAExtension', None)
58-
BuildExtension = getattr(module, 'BuildExtension', None)
59-
CUDA_HOME = getattr(module, 'CUDA_HOME', None)
60-
61-
if CUDAExtension and BuildExtension:
62-
log(f"✓ Method {i} successful: PyTorch CUDA extensions available")
63-
break
64-
except (ImportError, AttributeError) as e:
65-
log(f"Method {i} failed: {e}")
66-
continue
67-
68-
# Fallback: Manual CUDA_HOME detection
69-
if not CUDA_HOME:
70-
CUDA_HOME = os.environ.get('CUDA_HOME', '/usr/local/cuda')
71-
if os.path.exists(CUDA_HOME):
72-
log(f"✓ CUDA_HOME detected: {CUDA_HOME}")
73-
else:
74-
log("! CUDA_HOME not found, will try to build anyway")
75-
CUDA_HOME = '/usr/local/cuda' # Default for most systems
76-
77-
# Final check
78-
if CUDAExtension and BuildExtension:
79-
log("✓ All CUDA components available for build")
80-
else:
81-
log("! CUDA extension components not available, will use manual build")
82-
CUDAExtension = None
83-
BuildExtension = None
84-
85-
else:
86-
log("PyTorch CUDA not available")
87-
if FORCE_CUDA:
88-
log("Forced CUDA build enabled (CRAYON_FORCE_CUDA=1)")
89-
TORCH_CUDA_AVAILABLE = True
90-
else:
91-
TORCH_CUDA_AVAILABLE = False
92-
93-
except ImportError:
94-
log("PyTorch not installed")
95-
TORCH_CUDA_AVAILABLE = False
96-
CUDAExtension = None
97-
BuildExtension = None
98-
CUDA_HOME = None
99-
100-
# ============================================================================
101-
# ROBUST CUDA BUILD CLASS
102-
# ============================================================================
103-
104-
class CrayonBuildExt(build_ext):
105-
"""Custom build class that handles CUDA compilation with maximum compatibility"""
106-
107-
def build_extension(self, ext):
108-
if ext.name == "crayon.c_ext.crayon_cuda":
109-
self._build_cuda_extension_robust(ext)
110-
else:
111-
super().build_extension(ext)
112-
113-
def _build_cuda_extension_robust(self, ext):
114-
"""Build CUDA extension with maximum compatibility"""
115-
log(f"Building CUDA extension: {ext.name}")
116-
117-
# Get Python version info
118-
python_version = f"{sys.version_info.major}.{sys.version_info.minor}"
119-
120-
# Try multiple include paths
121-
include_paths = []
122-
123-
# Python include
124-
python_includes = [
125-
f"/usr/include/python{python_version}",
126-
f"/usr/local/include/python{python_version}",
127-
get_python_inc(),
128-
]
129-
for inc in python_includes:
130-
if os.path.exists(inc):
131-
include_paths.append(f"-I{inc}")
132-
break
133-
134-
# Torch include paths
135-
try:
136-
import torch
137-
torch_path = os.path.dirname(torch.__file__)
138-
torch_includes = [
139-
f"{torch_path}/include",
140-
f"{torch_path}/include/torch/csrc/api/include",
141-
f"{torch_path}/../include",
142-
]
143-
for inc in torch_includes:
144-
if os.path.exists(inc):
145-
include_paths.append(f"-I{inc}")
146-
except:
147-
pass
148-
149-
# CUDA include paths
150-
cuda_includes = [
151-
os.environ.get('CUDA_HOME', '/usr/local/cuda'),
152-
'/usr/local/cuda',
153-
'/usr/cuda',
154-
'C:/Program Files/NVIDIA GPU Computing Toolkit/CUDA/v12.8',
155-
'C:/Program Files/NVIDIA GPU Computing Toolkit/CUDA/v12.7',
156-
'C:/Program Files/NVIDIA GPU Computing Toolkit/CUDA/v12.6',
157-
'C:/Program Files/NVIDIA GPU Computing Toolkit/CUDA/v12.5',
158-
'C:/Program Files/NVIDIA GPU Computing Toolkit/CUDA/v12.4',
159-
'C:/Program Files/NVIDIA GPU Computing Toolkit/CUDA/v12.3',
160-
'C:/Program Files/NVIDIA GPU Computing Toolkit/CUDA/v12.2',
161-
'C:/Program Files/NVIDIA GPU Computing Toolkit/CUDA/v12.1',
162-
'C:/Program Files/NVIDIA GPU Computing Toolkit/CUDA/v12.0',
163-
'C:/Program Files/NVIDIA GPU Computing Toolkit/CUDA/v11.8',
164-
]
165-
166-
cuda_include = None
167-
for inc in cuda_includes:
168-
if os.path.exists(inc):
169-
cuda_include = f"{inc}/include"
170-
include_paths.append(f"-I{cuda_include}")
171-
log(f"✓ CUDA include found: {cuda_include}")
172-
break
173-
174-
if not cuda_include:
175-
log("! CUDA include not found, trying default paths")
176-
cuda_include = "/usr/local/cuda/include"
177-
include_paths.append(f"-I{cuda_include}")
178-
179-
# Build command for different platforms
180-
if sys.platform == "win32":
181-
# Windows build
182-
cmd = [
183-
"nvcc",
184-
"-O3", "-std=c++17",
185-
"--compiler-options", "/MD",
186-
"-shared",
187-
"-o", self.get_ext_fullname(ext.name).replace('.', '/') + ".pyd",
188-
ext.sources[0],
189-
] + include_paths + [
190-
"-D_GLIBCXX_USE_CXX11_ABI=0",
191-
"-Xcompiler", "/EHsc",
192-
]
193-
else:
194-
# Linux build
195-
cmd = [
196-
"nvcc",
197-
"-O3", "-std=c++17",
198-
"--compiler-options", "-fPIC",
199-
"-shared",
200-
"-o", self.get_ext_fullname(ext.name).replace('.', '/') + ".so",
201-
ext.sources[0],
202-
] + include_paths + [
203-
"-D_GLIBCXX_USE_CXX11_ABI=0",
204-
]
205-
206-
# Add GPU architecture flags
207-
try:
208-
if torch.cuda.is_available():
209-
major, minor = torch.cuda.get_device_capability()
210-
arch = f"{major}{minor}"
211-
cmd.extend([f"-gencode=arch=compute_{arch},code=sm_{arch}"])
212-
log(f"Compiling for GPU architecture: sm_{arch}")
213-
else:
214-
cmd.extend(["-gencode=arch=compute_75,code=sm_75"])
215-
log("Using default GPU architecture: sm_75")
216-
except:
217-
cmd.extend(["-gencode=arch=compute_75,code=sm_75"])
218-
log("Using default GPU architecture: sm_75")
219-
220-
log(f"CUDA build command: {' '.join(cmd)}")
221-
222-
try:
223-
# Create output directory
224-
output_dir = os.path.dirname(self.get_ext_fullname(ext.name).replace('.', '/'))
225-
os.makedirs(os.path.join(self.build_lib, output_dir), exist_ok=True)
226-
227-
# Run compilation
228-
result = subprocess.run(cmd, capture_output=True, text=True, cwd=self.build_lib)
229-
if result.returncode == 0:
230-
log(f"✓ CUDA extension {ext.name} built successfully")
231-
else:
232-
log(f"✗ CUDA build failed: {result.stderr}")
233-
# Don't raise error, just log it - extension will be skipped
234-
log("CUDA extension will be skipped, continuing with CPU-only build")
235-
except Exception as e:
236-
log(f"CUDA build error: {e}")
237-
log("CUDA extension will be skipped, continuing with CPU-only build")
238-
239-
# ============================================================================
240-
# EXTENSION CONFIGURATION
241-
# ============================================================================
16+
# Compiler flags
17+
if sys.platform == "win32":
18+
cpu_cflags = ["/O2", "/std:c++17"]
19+
else:
20+
cpu_cflags = ["-O3", "-fPIC", "-std=c++17"]
24221

22+
# CPU Extensions (always built)
24323
ext_modules = []
24424

245-
# CPU Extensions (always built)
246-
if sys.platform == "win32":
247-
cpu_args = ["/O2", "/std:c++17"]
248-
else:
249-
cpu_args = ["-O3", "-fPIC", "-std=c++17"]
25+
log("Adding CPU extensions...")
25026

251-
# CPU Extension
25227
ext_modules.append(Extension(
25328
"crayon.c_ext.crayon_cpu",
25429
sources=["src/crayon/c_ext/cpu_engine.cpp"],
255-
extra_compile_args=cpu_args,
30+
extra_compile_args=cpu_cflags,
25631
language="c++",
25732
))
25833

259-
# Trainer Extension
26034
ext_modules.append(Extension(
261-
"crayon.c_ext.crayon_trainer",
35+
"crayon.c_ext.crayon_trainer",
26236
sources=["src/crayon/c_ext/trainer.cpp"],
263-
extra_compile_args=cpu_args,
37+
extra_compile_args=cpu_cflags,
26438
language="c++",
26539
))
26640

267-
# Compiler Extension
26841
ext_modules.append(Extension(
26942
"crayon.c_ext.crayon_compiler",
27043
sources=["src/crayon/c_ext/compiler.cpp"],
271-
extra_compile_args=cpu_args,
44+
extra_compile_args=cpu_cflags,
27245
language="c++",
27346
))
27447

275-
# CUDA Extension (if available)
276-
if (TORCH_CUDA_AVAILABLE or FORCE_CUDA) and not FORCE_CPU:
277-
log("Adding CUDA extension to build queue")
278-
279-
# Use our robust build class
280-
cuda_ext = Extension(
281-
"crayon.c_ext.crayon_cuda",
282-
sources=["src/crayon/c_ext/gpu_engine_cuda.cu"],
283-
extra_compile_args={"nvcc": ["-O3", "-std=c++17", "--expt-relaxed-constexpr"]},
284-
language="c++",
285-
)
286-
ext_modules.append(cuda_ext)
287-
288-
# Use custom build class
289-
cmdclass = {"build_ext": CrayonBuildExt}
290-
log("Using robust CUDA build class")
291-
292-
else:
293-
cmdclass = {}
294-
if not FORCE_CPU:
295-
log("Skipping CUDA extension - not available or forced CPU")
296-
297-
# ============================================================================
298-
# SETUP
299-
# ============================================================================
300-
30148
setup(
30249
name="xerv-crayon",
30350
version=VERSION,
30451
packages=find_packages("src"),
30552
package_dir={"": "src"},
30653
include_package_data=True,
30754
ext_modules=ext_modules,
308-
cmdclass=cmdclass,
309-
python_requires=">=3.8",
310-
zip_safe=False,
311-
)
55+
python_requires=">=3.8,<3.14",
56+
install_requires=[
57+
"numpy>=1.21.0",
58+
],
59+
)

0 commit comments

Comments (0)