|
|
""" |
|
|
Documentation management for backend system prompts. |
|
|
Handles fetching, caching, and updating documentation from llms.txt files. |
|
|
No dependencies on Gradio or other heavy libraries - pure Python only. |
|
|
""" |
|
|
import os |
|
|
import re |
|
|
from datetime import datetime |
|
|
from typing import Optional |
|
|
|
|
|
try: |
|
|
import requests |
|
|
HAS_REQUESTS = True |
|
|
except ImportError: |
|
|
HAS_REQUESTS = False |
|
|
print("Warning: requests library not available, using minimal fallback") |
|
|
|
|
|
|
|
|
GRADIO_LLMS_TXT_URL = "https://www.gradio.app/llms.txt" |
|
|
GRADIO_DOCS_CACHE_FILE = ".backend_gradio_docs_cache.txt" |
|
|
GRADIO_DOCS_LAST_UPDATE_FILE = ".backend_gradio_docs_last_update.txt" |
|
|
|
|
|
TRANSFORMERSJS_DOCS_URL = "https://huggingface.co/docs/transformers.js/llms.txt" |
|
|
TRANSFORMERSJS_DOCS_CACHE_FILE = ".backend_transformersjs_docs_cache.txt" |
|
|
TRANSFORMERSJS_DOCS_LAST_UPDATE_FILE = ".backend_transformersjs_docs_last_update.txt" |
|
|
|
|
|
|
|
|
_gradio_docs_content: Optional[str] = None |
|
|
_gradio_docs_last_fetched: Optional[datetime] = None |
|
|
|
|
|
|
|
|
_transformersjs_docs_content: Optional[str] = None |
|
|
_transformersjs_docs_last_fetched: Optional[datetime] = None |
|
|
|
|
|
def fetch_gradio_docs() -> Optional[str]: |
|
|
"""Fetch the latest Gradio documentation from llms.txt""" |
|
|
if not HAS_REQUESTS: |
|
|
return None |
|
|
|
|
|
try: |
|
|
response = requests.get(GRADIO_LLMS_TXT_URL, timeout=10) |
|
|
response.raise_for_status() |
|
|
return response.text |
|
|
except Exception as e: |
|
|
print(f"Warning: Failed to fetch Gradio docs from {GRADIO_LLMS_TXT_URL}: {e}") |
|
|
return None |
|
|
|
|
|
def fetch_transformersjs_docs() -> Optional[str]: |
|
|
"""Fetch the latest transformers.js documentation from llms.txt""" |
|
|
if not HAS_REQUESTS: |
|
|
return None |
|
|
|
|
|
try: |
|
|
response = requests.get(TRANSFORMERSJS_DOCS_URL, timeout=10) |
|
|
response.raise_for_status() |
|
|
return response.text |
|
|
except Exception as e: |
|
|
print(f"Warning: Failed to fetch transformers.js docs from {TRANSFORMERSJS_DOCS_URL}: {e}") |
|
|
return None |
|
|
|
|
|
def filter_problematic_instructions(content: str) -> str: |
|
|
"""Filter out problematic instructions that cause LLM to stop generation prematurely""" |
|
|
if not content: |
|
|
return content |
|
|
|
|
|
|
|
|
problematic_patterns = [ |
|
|
r"Output ONLY the code inside a ``` code block, and do not include any explanations or extra text", |
|
|
r"output only the code inside a ```.*?``` code block", |
|
|
r"Always output only the.*?code.*?inside.*?```.*?```.*?block", |
|
|
r"Return ONLY the code inside a.*?```.*?``` code block", |
|
|
r"Do NOT add the language name at the top of the code output", |
|
|
r"do not include any explanations or extra text", |
|
|
r"Always output only the.*?code blocks.*?shown above, and do not include any explanations", |
|
|
r"Output.*?ONLY.*?code.*?inside.*?```.*?```", |
|
|
r"Return.*?ONLY.*?code.*?inside.*?```.*?```", |
|
|
r"Generate.*?ONLY.*?code.*?inside.*?```.*?```", |
|
|
r"Provide.*?ONLY.*?code.*?inside.*?```.*?```", |
|
|
] |
|
|
|
|
|
|
|
|
filtered_content = content |
|
|
for pattern in problematic_patterns: |
|
|
|
|
|
filtered_content = re.sub(pattern, "", filtered_content, flags=re.IGNORECASE | re.DOTALL) |
|
|
|
|
|
|
|
|
filtered_content = re.sub(r'\n\s*\n\s*\n', '\n\n', filtered_content) |
|
|
filtered_content = re.sub(r'^\s+', '', filtered_content, flags=re.MULTILINE) |
|
|
|
|
|
return filtered_content |
|
|
|
|
|
def load_cached_gradio_docs() -> Optional[str]: |
|
|
"""Load cached Gradio documentation from file""" |
|
|
try: |
|
|
if os.path.exists(GRADIO_DOCS_CACHE_FILE): |
|
|
with open(GRADIO_DOCS_CACHE_FILE, 'r', encoding='utf-8') as f: |
|
|
return f.read() |
|
|
except Exception as e: |
|
|
print(f"Warning: Failed to load cached Gradio docs: {e}") |
|
|
return None |
|
|
|
|
|
def save_gradio_docs_cache(content: str): |
|
|
"""Save Gradio documentation to cache file""" |
|
|
try: |
|
|
with open(GRADIO_DOCS_CACHE_FILE, 'w', encoding='utf-8') as f: |
|
|
f.write(content) |
|
|
with open(GRADIO_DOCS_LAST_UPDATE_FILE, 'w', encoding='utf-8') as f: |
|
|
f.write(datetime.now().isoformat()) |
|
|
except Exception as e: |
|
|
print(f"Warning: Failed to save Gradio docs cache: {e}") |
|
|
|
|
|
def should_update_gradio_docs() -> bool: |
|
|
"""Check if Gradio documentation should be updated""" |
|
|
|
|
|
return not os.path.exists(GRADIO_DOCS_CACHE_FILE) |
|
|
|
|
|
def load_cached_transformersjs_docs() -> Optional[str]: |
|
|
"""Load cached transformers.js documentation from file""" |
|
|
try: |
|
|
if os.path.exists(TRANSFORMERSJS_DOCS_CACHE_FILE): |
|
|
with open(TRANSFORMERSJS_DOCS_CACHE_FILE, 'r', encoding='utf-8') as f: |
|
|
return f.read() |
|
|
except Exception as e: |
|
|
print(f"Warning: Failed to load cached transformers.js docs: {e}") |
|
|
return None |
|
|
|
|
|
def save_transformersjs_docs_cache(content: str): |
|
|
"""Save transformers.js documentation to cache file""" |
|
|
try: |
|
|
with open(TRANSFORMERSJS_DOCS_CACHE_FILE, 'w', encoding='utf-8') as f: |
|
|
f.write(content) |
|
|
with open(TRANSFORMERSJS_DOCS_LAST_UPDATE_FILE, 'w', encoding='utf-8') as f: |
|
|
f.write(datetime.now().isoformat()) |
|
|
except Exception as e: |
|
|
print(f"Warning: Failed to save transformers.js docs cache: {e}") |
|
|
|
|
|
def should_update_transformersjs_docs() -> bool: |
|
|
"""Check if transformers.js documentation should be updated""" |
|
|
|
|
|
return not os.path.exists(TRANSFORMERSJS_DOCS_CACHE_FILE) |
|
|
|
|
|
def get_gradio_docs_content() -> str: |
|
|
"""Get the current Gradio documentation content, updating if necessary""" |
|
|
global _gradio_docs_content, _gradio_docs_last_fetched |
|
|
|
|
|
|
|
|
if (_gradio_docs_content is None or |
|
|
_gradio_docs_last_fetched is None or |
|
|
should_update_gradio_docs()): |
|
|
|
|
|
print("π Loading Gradio 6 documentation...") |
|
|
|
|
|
|
|
|
latest_content = fetch_gradio_docs() |
|
|
|
|
|
if latest_content: |
|
|
|
|
|
filtered_content = filter_problematic_instructions(latest_content) |
|
|
_gradio_docs_content = filtered_content |
|
|
_gradio_docs_last_fetched = datetime.now() |
|
|
save_gradio_docs_cache(filtered_content) |
|
|
print(f"β
Gradio 6 documentation loaded successfully ({len(filtered_content)} chars)") |
|
|
else: |
|
|
|
|
|
cached_content = load_cached_gradio_docs() |
|
|
if cached_content: |
|
|
_gradio_docs_content = cached_content |
|
|
_gradio_docs_last_fetched = datetime.now() |
|
|
print(f"β οΈ Using cached Gradio documentation (network fetch failed) ({len(cached_content)} chars)") |
|
|
else: |
|
|
|
|
|
_gradio_docs_content = """ |
|
|
# Gradio API Reference (Offline Fallback) |
|
|
|
|
|
This is a minimal fallback when documentation cannot be fetched. |
|
|
Please check your internet connection for the latest API reference. |
|
|
|
|
|
Basic Gradio components: Button, Textbox, Slider, Image, Audio, Video, File, etc. |
|
|
Use gr.Blocks() for custom layouts and gr.Interface() for simple apps. |
|
|
|
|
|
For the latest documentation, visit: https://www.gradio.app/llms.txt |
|
|
""" |
|
|
print("β Using minimal fallback documentation") |
|
|
|
|
|
return _gradio_docs_content or "" |
|
|
|
|
|
def get_transformersjs_docs_content() -> str: |
|
|
"""Get the current transformers.js documentation content, updating if necessary""" |
|
|
global _transformersjs_docs_content, _transformersjs_docs_last_fetched |
|
|
|
|
|
|
|
|
if (_transformersjs_docs_content is None or |
|
|
_transformersjs_docs_last_fetched is None or |
|
|
should_update_transformersjs_docs()): |
|
|
|
|
|
print("π Loading transformers.js documentation...") |
|
|
|
|
|
|
|
|
latest_content = fetch_transformersjs_docs() |
|
|
|
|
|
if latest_content: |
|
|
|
|
|
filtered_content = filter_problematic_instructions(latest_content) |
|
|
_transformersjs_docs_content = filtered_content |
|
|
_transformersjs_docs_last_fetched = datetime.now() |
|
|
save_transformersjs_docs_cache(filtered_content) |
|
|
print(f"β
transformers.js documentation loaded successfully ({len(filtered_content)} chars)") |
|
|
else: |
|
|
|
|
|
cached_content = load_cached_transformersjs_docs() |
|
|
if cached_content: |
|
|
_transformersjs_docs_content = cached_content |
|
|
_transformersjs_docs_last_fetched = datetime.now() |
|
|
print(f"β οΈ Using cached transformers.js documentation (network fetch failed) ({len(cached_content)} chars)") |
|
|
else: |
|
|
|
|
|
_transformersjs_docs_content = """ |
|
|
# Transformers.js API Reference (Offline Fallback) |
|
|
|
|
|
This is a minimal fallback when documentation cannot be fetched. |
|
|
Please check your internet connection for the latest API reference. |
|
|
|
|
|
Transformers.js allows you to run π€ Transformers models directly in the browser using ONNX Runtime. |
|
|
|
|
|
Key features: |
|
|
- pipeline() API for common tasks (sentiment-analysis, text-generation, etc.) |
|
|
- Support for custom models via model ID or path |
|
|
- WebGPU support for GPU acceleration |
|
|
- Quantization support (fp32, fp16, q8, q4) |
|
|
|
|
|
Basic usage: |
|
|
```javascript |
|
|
import { pipeline } from '@huggingface/transformers'; |
|
|
const pipe = await pipeline('sentiment-analysis'); |
|
|
const out = await pipe('I love transformers!'); |
|
|
``` |
|
|
|
|
|
For the latest documentation, visit: https://huggingface.co/docs/transformers.js |
|
|
""" |
|
|
print("β Using minimal fallback transformers.js documentation") |
|
|
|
|
|
return _transformersjs_docs_content or "" |
|
|
|
|
|
def build_gradio_system_prompt() -> str: |
|
|
"""Build the complete Gradio system prompt with full documentation""" |
|
|
|
|
|
|
|
|
docs_content = get_gradio_docs_content() |
|
|
|
|
|
|
|
|
base_prompt = """π¨ CRITICAL: You are an expert Gradio 6 developer. You MUST use Gradio 6 syntax and API. |
|
|
|
|
|
## Key Gradio 6 Changes (MUST FOLLOW): |
|
|
- Use `footer_links` parameter instead of removed `show_api` in gr.Blocks() |
|
|
- Use `api_visibility` instead of `api_name` in event listeners |
|
|
- Use modern Gradio 6 component syntax (check documentation below) |
|
|
- Gradio 6 has updated component APIs - always refer to the documentation below |
|
|
- DO NOT use deprecated Gradio 5 or older syntax |
|
|
|
|
|
Create a complete, working Gradio 6 application based on the user's request. Generate all necessary code to make the application functional and runnable. |
|
|
|
|
|
## Gradio 6 Example (Your Code Should Follow This Pattern): |
|
|
|
|
|
```python |
|
|
import gradio as gr |
|
|
|
|
|
def process(text): |
|
|
return f"Processed: {text}" |
|
|
|
|
|
# Gradio 6 Blocks with footer_links (NOT show_api) |
|
|
with gr.Blocks( |
|
|
title="My App", |
|
|
footer_links=[{"label": "Built with anycoder", "url": "https://huggingface.co/spaces/akhaliq/anycoder"}] |
|
|
) as demo: |
|
|
with gr.Row(): |
|
|
input_text = gr.Textbox(label="Input") |
|
|
output_text = gr.Textbox(label="Output") |
|
|
|
|
|
btn = gr.Button("Process") |
|
|
|
|
|
# Gradio 6 events use api_visibility (NOT just api_name) |
|
|
btn.click( |
|
|
fn=process, |
|
|
inputs=[input_text], |
|
|
outputs=[output_text], |
|
|
api_visibility="public" # Gradio 6 syntax |
|
|
) |
|
|
|
|
|
demo.launch() |
|
|
``` |
|
|
|
|
|
## Multi-File Application Structure |
|
|
|
|
|
When creating Gradio applications, organize your code into multiple files for proper deployment: |
|
|
|
|
|
**File Organization:** |
|
|
- `app.py` - Main application entry point (REQUIRED) |
|
|
- `requirements.txt` - Python dependencies (REQUIRED, auto-generated from imports) |
|
|
- `utils.py` - Utility functions and helpers (optional) |
|
|
- `models.py` - Model loading and inference functions (optional) |
|
|
- `config.py` - Configuration and constants (optional) |
|
|
|
|
|
**Output Format:** |
|
|
You MUST use this exact format with file separators: |
|
|
|
|
|
=== app.py === |
|
|
[complete app.py content] |
|
|
|
|
|
=== utils.py === |
|
|
[utility functions - if needed] |
|
|
|
|
|
**π¨ CRITICAL: DO NOT GENERATE requirements.txt or README.md** |
|
|
- requirements.txt is automatically generated from your app.py imports |
|
|
- README.md is automatically provided by the template |
|
|
- Generating these files will break the deployment process |
|
|
|
|
|
Requirements: |
|
|
1. Create a modern, intuitive Gradio application |
|
|
2. Use appropriate Gradio components (gr.Textbox, gr.Slider, etc.) |
|
|
3. Include proper error handling and loading states |
|
|
4. Use gr.Interface or gr.Blocks as appropriate |
|
|
5. Add helpful descriptions and examples |
|
|
6. Follow Gradio best practices |
|
|
7. Make the UI user-friendly with clear labels |
|
|
8. Include proper documentation in docstrings |
|
|
|
|
|
IMPORTANT: Always include "Built with anycoder" as clickable text in the header/top section of your application that links to https://huggingface.co/spaces/akhaliq/anycoder |
|
|
|
|
|
--- |
|
|
|
|
|
## Complete Gradio 6 Documentation |
|
|
|
|
|
Below is the complete, official Gradio 6 documentation automatically synced from https://www.gradio.app/llms.txt: |
|
|
|
|
|
""" |
|
|
|
|
|
|
|
|
full_prompt = base_prompt + docs_content |
|
|
|
|
|
|
|
|
final_instructions = """ |
|
|
|
|
|
--- |
|
|
|
|
|
## π¨ CRITICAL FINAL INSTRUCTIONS - GRADIO 6 ONLY |
|
|
|
|
|
YOU MUST USE GRADIO 6 SYNTAX. This is MANDATORY: |
|
|
|
|
|
1. **ONLY use Gradio 6 API** - Do NOT use Gradio 5 or older syntax |
|
|
2. **Reference the documentation above** - All function signatures and patterns are from Gradio 6 |
|
|
3. **Use modern Gradio 6 patterns:** |
|
|
- Use `footer_links` parameter in gr.Blocks() (NOT show_api) |
|
|
- Use `api_visibility` in event listeners (NOT api_name alone) |
|
|
- Use updated component syntax from Gradio 6 documentation |
|
|
4. **Follow Gradio 6 migration guide** if you see any deprecated patterns |
|
|
5. **Generate production-ready Gradio 6 code** that follows all best practices |
|
|
6. **Always include "Built with anycoder"** as clickable text in the header linking to https://huggingface.co/spaces/akhaliq/anycoder |
|
|
|
|
|
REMINDER: You are writing Gradio 6 code. Double-check all syntax against the Gradio 6 documentation provided above. |
|
|
|
|
|
""" |
|
|
|
|
|
return full_prompt + final_instructions |
|
|
|
|
|
def build_transformersjs_system_prompt() -> str: |
|
|
"""Build the complete transformers.js system prompt with full documentation""" |
|
|
|
|
|
|
|
|
docs_content = get_transformersjs_docs_content() |
|
|
|
|
|
|
|
|
base_prompt = """You are an expert transformers.js developer. Create a complete, working browser-based ML application using transformers.js based on the user's request. Generate all necessary code to make the application functional and runnable in the browser. |
|
|
|
|
|
## Multi-File Application Structure |
|
|
|
|
|
When creating transformers.js applications, organize your code into multiple files for proper deployment: |
|
|
|
|
|
**File Organization:** |
|
|
- `index.html` - Main HTML entry point (REQUIRED) |
|
|
- `app.js` - Main JavaScript application logic (REQUIRED) |
|
|
- `styles.css` - Styling (optional) |
|
|
- `worker.js` - Web Worker for model loading (recommended for better performance) |
|
|
- `package.json` - Node.js dependencies if using bundler (optional) |
|
|
|
|
|
**Output Format:** |
|
|
You MUST use this exact format with file separators: |
|
|
|
|
|
=== index.html === |
|
|
[complete HTML content] |
|
|
|
|
|
=== app.js === |
|
|
[complete JavaScript content] |
|
|
|
|
|
=== worker.js === |
|
|
[web worker content - if needed] |
|
|
|
|
|
**π¨ CRITICAL: Best Practices** |
|
|
- Use CDN for transformers.js: https://cdn.jsdelivr.net/npm/@huggingface/transformers |
|
|
- Implement loading states and progress indicators |
|
|
- Use Web Workers for model loading to avoid blocking UI |
|
|
- Handle errors gracefully with user-friendly messages |
|
|
- Show model download progress when applicable |
|
|
- Use quantized models (q8, q4) for faster loading in browser |
|
|
|
|
|
Requirements: |
|
|
1. Create a modern, responsive web application |
|
|
2. Use appropriate transformers.js pipelines and models |
|
|
3. Include proper error handling and loading states |
|
|
4. Implement progress indicators for model loading |
|
|
5. Add helpful descriptions and examples |
|
|
6. Follow browser best practices (async/await, Web Workers, etc.) |
|
|
7. Make the UI user-friendly with clear labels |
|
|
8. Include proper comments in code |
|
|
|
|
|
IMPORTANT: Always include "Built with anycoder" as clickable text in the header/top section of your application that links to https://huggingface.co/spaces/akhaliq/anycoder |
|
|
|
|
|
--- |
|
|
|
|
|
## Complete transformers.js Documentation |
|
|
|
|
|
Below is the complete, official transformers.js documentation automatically synced from https://huggingface.co/docs/transformers.js/llms.txt: |
|
|
|
|
|
""" |
|
|
|
|
|
|
|
|
full_prompt = base_prompt + docs_content |
|
|
|
|
|
|
|
|
final_instructions = """ |
|
|
|
|
|
--- |
|
|
|
|
|
## Final Instructions |
|
|
|
|
|
- Always use the exact function signatures and patterns from the transformers.js documentation above |
|
|
- Use the pipeline() API for common tasks |
|
|
- Implement WebGPU support when appropriate for better performance |
|
|
- Use quantized models by default (q8 or q4) for faster browser loading |
|
|
- Generate production-ready code that follows all best practices |
|
|
- Always include the "Built with anycoder" attribution in the header |
|
|
- Consider using Web Workers for heavy computation to keep UI responsive |
|
|
|
|
|
""" |
|
|
|
|
|
return full_prompt + final_instructions |
|
|
|
|
|
def initialize_backend_docs(): |
|
|
"""Initialize backend documentation system on startup""" |
|
|
try: |
|
|
|
|
|
gradio_docs = get_gradio_docs_content() |
|
|
if gradio_docs: |
|
|
print(f"π Gradio documentation initialized ({len(gradio_docs)} chars loaded)") |
|
|
else: |
|
|
print("β οΈ Gradio documentation initialized with fallback content") |
|
|
|
|
|
|
|
|
transformersjs_docs = get_transformersjs_docs_content() |
|
|
if transformersjs_docs: |
|
|
print(f"π transformers.js documentation initialized ({len(transformersjs_docs)} chars loaded)") |
|
|
else: |
|
|
print("β οΈ transformers.js documentation initialized with fallback content") |
|
|
|
|
|
except Exception as e: |
|
|
print(f"Warning: Failed to initialize backend documentation: {e}") |
|
|
|
|
|
|
|
|
if __name__ != "__main__": |
|
|
|
|
|
try: |
|
|
initialize_backend_docs() |
|
|
except Exception as e: |
|
|
print(f"Warning: Failed to auto-initialize backend docs: {e}") |
|
|
|
|
|
|