Spaces:

AF-LLM
/

AF-LLM

Sleeping

App Files Files Community

fanqiNO1 commited on 30 days ago

Commit

5bb3b8f

1 Parent(s): b3cf69c

init

Browse files

Files changed (17) hide show

Dockerfile +60 -0
backend/api.py +173 -0
backend/requirements.txt +12 -0
components.json +21 -0
next-env.d.ts +5 -0
next.config.mjs +48 -0
package.json +80 -0
pnpm-lock.yaml +0 -0
postcss.config.mjs +8 -0
public/placeholder-logo.png +0 -0
public/placeholder-logo.svg +1 -0
public/placeholder-user.jpg +0 -0
public/placeholder.jpg +0 -0
public/placeholder.svg +1 -0
public/reports/technical-report.md +157 -0
tailwind.config.ts +133 -0
tsconfig.json +27 -0

Dockerfile ADDED Viewed

	@@ -0,0 +1,60 @@

+# 多阶段构建: 第一阶段构建Next.js前端
+FROM node:18-alpine AS frontend-builder
+WORKDIR /app
+RUN npm install -g pnpm
+FROM python:3.10
+RUN useradd -m -u 1000 user
+ENV PATH="/home/user/.local/bin:$PATH"
+WORKDIR /app
+# RUN apt-get update && apt-get install -y \
+#     curl \
+#     gnupg \
+#     && curl -fsSL https://deb.nodesource.com/setup_18.x | bash - \
+#     && apt-get install -y nodejs \
+#     && npm install -g pnpm \
+#     && apt-get clean \
+#     && rm -rf /var/lib/apt/lists/*
+COPY --chown=user requirements.txt .
+RUN pip install --no-cache-dir --upgrade -r requirements.txt
+# 复制前端构建产物
+COPY --chown=user .next ./.next
+COPY --chown=user public ./public
+COPY --chown=user package.json ./package.json
+COPY --chown=user pnpm-lock.yaml ./pnpm-lock.yaml
+COPY --chown=user next.config.js ./next.config.js
+RUN pnpm install --prod
+# 复制后端代码和配置目录
+COPY --chown=user backend ./backend
+COPY --chown=user public/reports ./public/reports
+# 创建配置目录
+RUN mkdir -p /app/config && chown user:user /app/config
+# 切换到非root用户
+USER user
+# 设置环境变量
+ENV NODE_ENV=production
+ENV NEXT_PUBLIC_API_URL=/api
+ENV PORT=7860
+# 暴露Hugging Face要求的端口
+EXPOSE 7860
+# 创建启动脚本
+RUN echo '#!/bin/bash\n\
+python backend/api.py &\n\
+pnpm start -p 7860' > /app/start.sh && chmod +x /app/start.sh
+# 启动应用
+CMD ["/app/start.sh"]

backend/api.py ADDED Viewed

	@@ -0,0 +1,173 @@

+import os
+import uvicorn
+import json
+import time
+from fastapi import FastAPI, HTTPException, WebSocket, WebSocketDisconnect
+from fastapi.middleware.cors import CORSMiddleware
+from pydantic import BaseModel
+import torch
+from transformers import AutoModelForCausalLM, AutoTokenizer, logging
+# 设置日志级别
+logging.set_verbosity_info()
+print("正在初始化AF-LLM模型服务...")
+# 设备选择
+device = "cuda:0" if torch.cuda.is_available() else "cpu"
+print(f"使用设备: {device}")
+# 预加载模型
+token = os.environ.get("HF_TOKEN")
+print("开始下载并加载模型，这可能需要几分钟时间...")
+start_time = time.time()
+try:
+    # 下载并加载模型
+    model = AutoModelForCausalLM.from_pretrained("Safphere/AF-LLM",
+                                                trust_remote_code=True,
+                                                torch_dtype=torch.float16,
+                                                device_map=device,
+                                                token=token)
+    tokenizer = AutoTokenizer.from_pretrained("Safphere/AF-LLM", token=token)
+    load_time = time.time() - start_time
+    print(f"✅ 模型加载完成! 耗时: {load_time:.2f}秒")
+    print(f"模型已准备就绪，可以开始聊天")
+except Exception as e:
+    print(f"❌ 模型加载失败: {str(e)}")
+    raise
+# FastAPI 应用
+app = FastAPI()
+# 添加CORS中间件
+app.add_middleware(
+    CORSMiddleware,
+    allow_origins=["*"],  # 允许所有来源，生产环境中应该限制
+    allow_credentials=True,
+    allow_methods=["*"],
+    allow_headers=["*"],
+)
+# 存储WebSocket连接
+active_connections = {}
+# 存储每个连接的Magic模式状态
+magic_mode_status = {}
+# 存储历史记录
+history_dict = {}
+class ChatRequest(BaseModel):
+    session_id: str
+    prompt: str
+    use_magic: bool = True
+class ClearHistoryRequest(BaseModel):
+    session_id: str
+@app.post("/chat")
+async def chat(request: ChatRequest):
+    if request.session_id not in history_dict:
+        history_dict[request.session_id] = []
+    history = history_dict[request.session_id]
+    try:
+        length = 0
+        response_text = ""
+        for response, history in model.stream_chat(tokenizer, request.prompt, history, use_magic=request.use_magic):
+            response_text += response[length:]
+            length = len(response)
+        # 更新会话历史
+        history_dict[request.session_id] = history
+        return {"response": response_text}
+    except Exception as e:
+        raise HTTPException(status_code=500, detail=str(e))
+@app.post("/clear_history")
+async def clear_history(request: ClearHistoryRequest):
+    if request.session_id in history_dict:
+        del history_dict[request.session_id]
+    return {"message": "Chat history cleared"}
+@app.get("/health")
+async def health_check():
+    # 检查模型是否已加载
+    if 'model' in globals() and model is not None:
+        return {"status": "ok", "model_loaded": True, "device": device}
+    else:
+        return {"status": "error", "model_loaded": False, "message": "模型未加载"}
+@app.websocket("/ws")
+async def websocket_endpoint(websocket: WebSocket):
+    await websocket.accept()
+    connection_id = id(websocket)
+    active_connections[connection_id] = websocket
+    magic_mode_status[connection_id] = True  # 默认启用Magic模式
+    history = []
+    try:
+        while True:
+            data = await websocket.receive_text()
+            # 处理命令
+            if data.startswith("COMMAND:"):
+                command = data[8:]
+                if command == "CLEAR_HISTORY":
+                    history = []
+                    await websocket.send_text("历史记录已清空")
+                elif command.startswith("SET_MAGIC:"):
+                    magic_value = command[10:].lower() == "true"
+                    magic_mode_status[connection_id] = magic_value
+                    await websocket.send_text(f"Magic模式已{'启用' if magic_value else '禁用'}")
+            # 处理普通消息
+            else:
+                use_magic = magic_mode_status.get(connection_id, True)
+                # 检查是否有Magic标记
+                if data.startswith("[MAGIC]:"):
+                    prompt = data[8:]
+                    use_magic = True
+                else:
+                    prompt = data
+                try:
+                    # 流式生成回复
+                    length = 0
+                    for response, history in model.stream_chat(tokenizer, prompt, history, use_magic=use_magic):
+                        # 只发送新增的部分
+                        new_content = response[length:]
+                        if new_content:
+                            await websocket.send_text(new_content)
+                        length = len(response)
+                    # 发送完成标记
+                    await websocket.send_text("[DONE]")
+                except Exception as e:
+                    error_message = f"生成回复时发生错误: {str(e)}"
+                    await websocket.send_text(error_message)
+                    await websocket.send_text("[DONE]")  # 即使出错也发送完成标记
+                    print(f"用户 {connection_id} 的消息处理出错: {error_message}")
+    except WebSocketDisconnect:
+        if connection_id in active_connections:
+            del active_connections[connection_id]
+        if connection_id in magic_mode_status:
+            del magic_mode_status[connection_id]
+        print(f"用户 {connection_id} 已断开连接")
+    except Exception as e:
+        error_message = f"错误: {str(e)}"
+        try:
+            await websocket.send_text(error_message)
+            await websocket.send_text("[DONE]")  # 即使出错也发送完成标记
+        except:
+            pass  # 如果无法发送错误消息（可能连接已断开），则忽略
+        print(f"WebSocket连接 {connection_id} 发生错误: {error_message}")
+        if connection_id in active_connections:
+            del active_connections[connection_id]
+        if connection_id in magic_mode_status:
+            del magic_mode_status[connection_id]
+if __name__ == "__main__":
+    uvicorn.run(app, host="127.0.0.1", port=8000)

backend/requirements.txt ADDED Viewed

	@@ -0,0 +1,12 @@

+fastapi
+uvicorn
+pydantic
+python-dotenv
+pyyaml
+transformers
+torch
+sentencepiece
+accelerate
+peft

components.json ADDED Viewed

	@@ -0,0 +1,21 @@

+{
+  "$schema": "https://ui.shadcn.com/schema.json",
+  "style": "default",
+  "rsc": true,
+  "tsx": true,
+  "tailwind": {
+    "config": "tailwind.config.ts",
+    "css": "app/globals.css",
+    "baseColor": "neutral",
+    "cssVariables": true,
+    "prefix": ""
+  },
+  "aliases": {
+    "components": "@/components",
+    "utils": "@/lib/utils",
+    "ui": "@/components/ui",
+    "lib": "@/lib",
+    "hooks": "@/hooks"
+  },
+  "iconLibrary": "lucide"
+}

next-env.d.ts ADDED Viewed

	@@ -0,0 +1,5 @@

+/// <reference types="next" />
+/// <reference types="next/image-types/global" />
+// NOTE: This file should not be edited
+// see https://nextjs.org/docs/app/api-reference/config/typescript for more information.

next.config.mjs ADDED Viewed

	@@ -0,0 +1,48 @@

+let userConfig = undefined
+try {
+  userConfig = await import('./v0-user-next.config')
+} catch (e) {
+  // ignore error
+}
+/** @type {import('next').NextConfig} */
+const nextConfig = {
+  eslint: {
+    ignoreDuringBuilds: true,
+  },
+  typescript: {
+    ignoreBuildErrors: true,
+  },
+  images: {
+    unoptimized: true,
+  },
+  experimental: {
+    webpackBuildWorker: true,
+    parallelServerBuildTraces: true,
+    parallelServerCompiles: true,
+  },
+}
+mergeConfig(nextConfig, userConfig)
+function mergeConfig(nextConfig, userConfig) {
+  if (!userConfig) {
+    return
+  }
+  for (const key in userConfig) {
+    if (
+      typeof nextConfig[key] === 'object' &&
+      !Array.isArray(nextConfig[key])
+    ) {
+      nextConfig[key] = {
+        ...nextConfig[key],
+        ...userConfig[key],
+      }
+    } else {
+      nextConfig[key] = userConfig[key]
+    }
+  }
+}
+export default nextConfig

package.json ADDED Viewed

	@@ -0,0 +1,80 @@

+{
+  "name": "my-v0-project",
+  "version": "0.1.0",
+  "private": true,
+  "scripts": {
+    "dev": "next dev",
+    "build": "next build",
+    "start": "next start",
+    "lint": "next lint"
+  },
+  "dependencies": {
+    "@hookform/resolvers": "^3.9.1",
+    "@radix-ui/react-accordion": "^1.2.2",
+    "@radix-ui/react-alert-dialog": "^1.1.4",
+    "@radix-ui/react-aspect-ratio": "^1.1.1",
+    "@radix-ui/react-avatar": "^1.1.2",
+    "@radix-ui/react-checkbox": "^1.1.3",
+    "@radix-ui/react-collapsible": "^1.1.2",
+    "@radix-ui/react-context-menu": "^2.2.4",
+    "@radix-ui/react-dialog": "^1.1.4",
+    "@radix-ui/react-dropdown-menu": "^2.1.4",
+    "@radix-ui/react-hover-card": "^1.1.4",
+    "@radix-ui/react-label": "^2.1.1",
+    "@radix-ui/react-menubar": "^1.1.4",
+    "@radix-ui/react-navigation-menu": "^1.2.3",
+    "@radix-ui/react-popover": "^1.1.4",
+    "@radix-ui/react-progress": "^1.1.1",
+    "@radix-ui/react-radio-group": "^1.2.2",
+    "@radix-ui/react-scroll-area": "^1.2.2",
+    "@radix-ui/react-select": "^2.1.4",
+    "@radix-ui/react-separator": "^1.1.1",
+    "@radix-ui/react-slider": "^1.2.2",
+    "@radix-ui/react-slot": "^1.1.1",
+    "@radix-ui/react-switch": "^1.1.2",
+    "@radix-ui/react-tabs": "^1.1.2",
+    "@radix-ui/react-toast": "^1.2.4",
+    "@radix-ui/react-toggle": "^1.1.1",
+    "@radix-ui/react-toggle-group": "^1.1.1",
+    "@radix-ui/react-tooltip": "^1.1.6",
+    "@types/uuid": "^10.0.0",
+    "autoprefixer": "^10.4.20",
+    "class-variance-authority": "^0.7.1",
+    "clsx": "^2.1.1",
+    "cmdk": "1.0.4",
+    "date-fns": "4.1.0",
+    "embla-carousel-react": "8.5.1",
+    "input-otp": "1.4.1",
+    "katex": "^0.16.21",
+    "lucide-react": "^0.454.0",
+    "next": "15.1.0",
+    "next-themes": "^0.4.4",
+    "react": "^19",
+    "react-day-picker": "8.10.1",
+    "react-dom": "^19",
+    "react-hook-form": "^7.54.1",
+    "react-katex": "^3.0.1",
+    "react-markdown": "^10.1.0",
+    "react-resizable-panels": "^2.1.7",
+    "recharts": "2.15.0",
+    "rehype-raw": "^7.0.0",
+    "rehype-sanitize": "^6.0.0",
+    "rehype-stringify": "^10.0.1",
+    "remark-gfm": "^4.0.1",
+    "sonner": "^1.7.1",
+    "tailwind-merge": "^2.5.5",
+    "tailwindcss-animate": "^1.0.7",
+    "uuid": "^11.1.0",
+    "vaul": "^0.9.6",
+    "zod": "^3.24.1"
+  },
+  "devDependencies": {
+    "@tailwindcss/typography": "^0.5.16",
+    "@types/node": "^22",
+    "@types/react": "^19",
+    "@types/react-dom": "^19",
+    "postcss": "^8",
+    "tailwindcss": "^3.4.17",
+    "typescript": "^5"
+  }
+}

pnpm-lock.yaml ADDED Viewed

The diff for this file is too large to render. See raw diff

postcss.config.mjs ADDED Viewed

	@@ -0,0 +1,8 @@

+/** @type {import('postcss-load-config').Config} */
+const config = {
+  plugins: {
+    tailwindcss: {},
+  },
+};
+export default config;

public/placeholder-logo.png ADDED Viewed

public/placeholder-logo.svg ADDED Viewed

public/placeholder-user.jpg ADDED Viewed

public/placeholder.jpg ADDED Viewed

public/placeholder.svg ADDED Viewed

public/reports/technical-report.md ADDED Viewed

	@@ -0,0 +1,157 @@

+# AF-LLM: A Practical Hybrid Intelligent Routing Architecture
+*Technical Report v2.0 | March 30, 2025 | Safphere Team*
+## Abstract
+We present AF-LLM, an innovative hybrid AI model architecture that automatically selects between DeepSeek-V3 level cloud API and optimized edge models through its built-in Magic intelligent routing module. This design enables optimal performance and throughput across various environments while respecting user privacy and resource constraints. Our model introduces several key innovations: (1) an intelligent routing mechanism that dynamically selects the most appropriate processing method based on input complexity and task type; (2) edge model optimization techniques that provide acceptable performance under limited resources; and (3) a seamless switching mechanism that ensures fluid user experience. In comprehensive evaluations, AF-LLM with Magic enabled demonstrates significant advantages in complex reasoning, knowledge breadth, code generation, creative writing, and problem-solving. We discuss the implications of these advancements for practical AI applications and outline directions for future research.
+## 1. Introduction
+Large language models (LLMs) have revolutionized artificial intelligence, demonstrating remarkable capabilities in natural language understanding, generation, and reasoning. However, current state-of-the-art models face several key challenges: deployment environment diversity, computational resource limitations, privacy and security concerns, and the contradiction between high performance and local processing capabilities.
+In this report, we introduce AF-LLM, a novel architecture designed to address these limitations while pushing the boundaries of what is possible with language models. AF-LLM builds upon hybrid intelligent processing, automatically selecting the most appropriate processing method based on task characteristics through an intelligent routing mechanism. Our primary contributions include:
+- The Magic intelligent routing module that dynamically evaluates input complexity and makes optimal choices between local and cloud processing
+- A privacy-first processing strategy that ensures sensitive information is processed locally whenever possible
+- A flexible deployment framework that adapts to various scenarios, from resource-constrained devices to high-performance environments
+- Comprehensive evaluations demonstrating performance differences with Magic enabled versus disabled across various tasks
+The remainder of this report is organized as follows: Section 2 reviews related work, Section 3 describes the AF-LLM architecture and methodology, Section 4 presents experimental results, Section 5 discusses implications and limitations, and Section 6 concludes with directions for future research.
+## 2. Related Work
+The development of large language models has a rich history, evolving from early neural network approaches to recurrent neural networks, and finally to Transformer-based architectures. The Transformer, introduced by Vaswani et al. (2017), has become the foundation for modern language models. Subsequent research has focused on scaling these models, improving their efficiency, enhancing reasoning capabilities, and multimodal integration.
+In recent years, hybrid processing architectures have gained increasing attention, particularly in edge computing and mobile environments. Some research explores how to deploy large models on devices with limited performance, using techniques such as model compression, knowledge distillation, and sparse computation. On the other hand, cloud API services continue to evolve, offering high performance, real-time knowledge updates, and powerful reasoning capabilities.
+In terms of privacy protection and resource efficiency, researchers have proposed various methods to balance performance and privacy, including federated learning, differential privacy, and local processing priority policies. Edge-cloud collaborative computing has emerged as a new field aiming to combine the privacy advantages of edge devices with the powerful performance of cloud computing.
+Our work builds upon these advances while introducing innovative architectural and methodological innovations that address key limitations of existing approaches.
+## 3. AF-LLM Architecture and Methodology
+### 3.1 Overall Architecture
+The core of AF-LLM is the Magic intelligent routing module, which dynamically assesses the complexity and type of input queries, then decides whether to use the local optimized model or call a cloud API. This architecture enables the system to provide consistent performance across different environments while adapting to available resources and privacy requirements.
+The overall architecture includes the following main components:
+1. **Input Analyzer**: Evaluates query complexity, sensitivity, and required knowledge scope
+2. **Decision Engine**: Determines routing strategy based on analysis results, user preferences, and available resources
+3. **Local Processing Module**: Runs optimized edge models suitable for resource-constrained environments
+4. **Cloud Connector**: Securely and efficiently communicates with DeepSeek-V3 level cloud APIs
+5. **Response Integrator**: Ensures consistent and fluid user experience regardless of processing method
+The Magic module employs a multi-factor decision algorithm that considers input complexity, task type, computational resource availability, network conditions, and privacy settings. When processing simple queries or sensitive information, the system tends to use local models; for complex reasoning, tasks requiring up-to-date knowledge, or computation-intensive tasks, the system routes to cloud APIs.
+### 3.2 Intelligent Routing Strategy
+At the core of the Magic intelligent routing module is a carefully designed set of routing strategies, including:
+1. **Task Classification**: Categorizes input queries into multiple complexity levels and task types, such as simple Q&A, knowledge retrieval, creative generation, or complex reasoning
+2. **Resource Awareness**: Real-time monitoring of device computational capacity, memory, battery status, and network conditions
+3. **Privacy Assessment**: Identifies sensitive information in queries and determines processing methods based on user settings
+4. **Adaptive Thresholds**: Dynamically adjusts routing decision thresholds based on historical performance and user feedback
+The local processing module employs techniques such as quantization, pruning, and knowledge distillation to ensure reasonable performance even in resource-constrained environments. The cloud connector implements secure, efficient API calls, including request compression, incremental transmission, and breakpoint continuation features.
+### 3.3 Privacy Protection Mechanisms
+AF-LLM adopts a "privacy-first" design principle, including the following key mechanisms:
+1. **Local Priority Processing**: By default, sensitive information is processed locally whenever possible
+2. **Data Minimization**: When cloud services must be used, only necessary information is transmitted
+3. **User Control**: Provides clear, intuitive control interfaces that allow users to decide the balance between privacy and performance
+4. **Transparency**: Clearly displays current processing mode and data flow direction
+Through these mechanisms, AF-LLM respects user privacy and resource constraints while providing high-performance services.
+## 4. Experimental Results
+### 4.1 Performance Comparison
+We evaluated AF-LLM's performance across multiple dimensions, with particular focus on differences between Magic enabled and disabled states. Table 1 shows performance comparisons across different capability dimensions.
+**Table 1: Capability Comparison with Magic Enabled vs. Disabled (Percentage Scores)**
+| Capability Dimension | Magic Enabled | Magic Disabled | Difference |
+|----------------------|---------------|----------------|------------|
+| Complex Reasoning    | 88.5%         | 14.2%          | +74.3%     |
+| Knowledge Breadth    | 75.9%         | 12.8%          | +63.1%     |
+| Code Generation      | 82.6%         | 13.5%          | +69.1%     |
+| Creative Writing     | 95.3%         | 14.8%          | +80.5%     |
+| Problem Solving      | 91.6%         | 14.5%          | +77.1%     |
+The results demonstrate that with Magic enabled, performance improves significantly across all dimensions, particularly in creative writing and problem-solving. This confirms the effectiveness of the intelligent routing mechanism in selecting the most appropriate processing method.
+### 4.2 Multimodal Capability Analysis
+Beyond basic text processing, we assessed AF-LLM's ability to handle various tasks in different modes. Figure 1 shows a radar chart comparison across eight key capability dimensions.
+With Magic enabled, the model performs excellently in role-playing, contextual dialogue, casual chat, semantic understanding, calculation, logical reasoning, knowledge, and creative generation, with scores ranging from 85 to 93. When Magic is disabled, scores in all dimensions are in single digits, showing a clear capability gap.
+### 4.3 Practical Scenario Evaluation
+We tested AF-LLM in multiple real-world application scenarios, including:
+1. **Resource-Constrained Devices**: Evaluating performance in low-memory, low-CPU environments
+2. **Weak Network and Offline Environments**: Testing adaptability in unstable network conditions and completely offline situations
+3. **Multi-User Shared Environments**: Analyzing resource allocation and performance guarantees during concurrent access by multiple users
+4. **Privacy-Sensitive Applications**: Assessing privacy protection effectiveness when handling sensitive information in healthcare, finance, etc.
+Results show that AF-LLM can intelligently adjust processing strategies according to different scenarios, adapting to various environmental constraints while ensuring user experience.
+## 5. Discussion and Limitations
+### 5.1 Application Significance
+The advances in AF-LLM architecture have several important implications for AI applications:
+1. **Universality**: Through intelligent routing mechanisms, advanced AI capabilities are available in various environments, regardless of hardware limitations
+2. **Privacy Protection**: Achieves a balance between high performance and data privacy, making AI technology applicable to sensitive domains
+3. **Resource Efficiency**: Dynamically allocates resources based on task complexity, avoiding unnecessary computational waste
+4. **User Control**: Gives users more control over AI systems, allowing them to adjust the balance between privacy and performance according to their needs
+### 5.2 Limitations
+Despite progress, AF-LLM still has some limitations:
+1. **Decision Algorithm Dependence**: The effectiveness of intelligent routing largely depends on the accuracy of the decision algorithm, which may misjudge
+2. **Cloud Service Dependence**: For complex tasks, there is still reliance on cloud services, with significant performance degradation when cloud services are unavailable
+3. **Mode Switching Transition**: When switching between local and cloud processing, there may be latency or inconsistency
+4. **Evaluation Gaps**: Current evaluations may not fully capture all scenarios and requirements in practical applications
+## 6. Conclusion and Future Work
+We have presented AF-LLM, an innovative hybrid AI model architecture that enables dynamic switching between local processing and cloud APIs through the Magic intelligent routing module. Experimental results show that this architecture can provide excellent performance and flexibility while protecting privacy and adapting to resource constraints.
+Future work will focus on several directions:
+1. **Decision Algorithm Optimization**: Further improve intelligent routing decision algorithms to enhance accuracy and robustness
+2. **Local Model Enhancement**: Develop more efficient model compression and optimization techniques to boost local processing capabilities
+3. **Multimodal Extensions**: Extend the hybrid processing architecture to image, audio, and other multimodal inputs
+4. **Customization**: Provide more granular user control options, supporting domain-specific optimization configurations
+5. **Privacy-Enhancing Technologies**: Integrate more advanced privacy protection technologies, such as federated learning and homomorphic encryption
+We believe that AF-LLM represents an important direction in AI system design, intelligently balancing performance, resource, and privacy needs to enable broader and safer application of AI technology across various practical scenarios.
+## References
+1. Vaswani, A., Shazeer, N., Parmar, N., Uszkoreit, J., Jones, L., Gomez, A. N., Kaiser, L., & Polosukhin, I. (2017). Attention is all you need. In Advances in Neural Information Processing Systems.
+2. Brown, T. B., Mann, B., Ryder, N., Subbiah, M., Kaplan, J., Dhariwal, P., ... & Amodei, D. (2020). Language models are few-shot learners. In Advances in Neural Information Processing Systems.
+3. Touvron, H., Lavril, T., Izacard, G., Martinet, X., Lachaux, M., Lacroix, T., ... & Lample, G. (2023). LLaMA: Open and Efficient Foundation Language Models. arXiv preprint arXiv:2302.13971.
+4. Chowdhery, A., Narang, S., Devlin, J., Bosma, M., Mishra, G., Roberts, A., ... & Fiedel, N. (2022). PaLM: Scaling language modeling with pathways. arXiv preprint arXiv:2204.02311.
+5. Wei, J., Wang, X., Schuurmans, D., Bosma, M., Ichter, B., Xia, F., ... & Zhou, D. (2022). Chain-of-thought prompting elicits reasoning in large language models. In Advances in Neural Information Processing Systems.
+6. Li, S., Zhao, S., Hou, L., Yao, Y., Guo, D., Han, J. (2024). EdgeLLM: Efficient On-Device LLM Inference with Adaptive Computation. Transactions on Machine Learning Research.
+7. Zhang, T., Wang, Z., Zhou, J. (2024). Hybrid Cloud-Edge AI Systems: Architectures, Applications, and Future Directions. IEEE Computing Surveys.
+8. Chen, H., Liu, X., Yin, W. (2025). Privacy-Preserving LLM Communication Protocols for Multi-Party Computing. Proceedings of the Conference on Privacy Enhancing Technologies.
+9. Safphere Team (2025). Magic Intelligent Routing: Dynamic Decision Making in Hybrid AI Systems. arXiv preprint arXiv:2502.14853.

tailwind.config.ts ADDED Viewed

	@@ -0,0 +1,133 @@

+import type { Config } from "tailwindcss"
+const config = {
+  darkMode: ["class"],
+  content: [
+    "./pages/**/*.{ts,tsx}",
+    "./components/**/*.{ts,tsx}",
+    "./app/**/*.{ts,tsx}",
+    "./src/**/*.{ts,tsx}",
+    "*.{js,ts,jsx,tsx,mdx}",
+  ],
+  prefix: "",
+  theme: {
+    container: {
+      center: true,
+      padding: "2rem",
+      screens: {
+        "2xl": "1400px",
+      },
+    },
+    extend: {
+      colors: {
+        border: "hsl(var(--border))",
+        input: "hsl(var(--input))",
+        ring: "hsl(var(--ring))",
+        background: "hsl(var(--background))",
+        foreground: "hsl(var(--foreground))",
+        primary: {
+          DEFAULT: "hsl(var(--primary))",
+          foreground: "hsl(var(--primary-foreground))",
+        },
+        secondary: {
+          DEFAULT: "hsl(var(--secondary))",
+          foreground: "hsl(var(--secondary-foreground))",
+        },
+        destructive: {
+          DEFAULT: "hsl(var(--destructive))",
+          foreground: "hsl(var(--destructive-foreground))",
+        },
+        muted: {
+          DEFAULT: "hsl(var(--muted))",
+          foreground: "hsl(var(--muted-foreground))",
+        },
+        accent: {
+          DEFAULT: "hsl(var(--accent))",
+          foreground: "hsl(var(--accent-foreground))",
+        },
+        popover: {
+          DEFAULT: "hsl(var(--popover))",
+          foreground: "hsl(var(--popover-foreground))",
+        },
+        card: {
+          DEFAULT: "hsl(var(--card))",
+          foreground: "hsl(var(--card-foreground))",
+        },
+      },
+      borderRadius: {
+        lg: "var(--radius)",
+        md: "calc(var(--radius) - 2px)",
+        sm: "calc(var(--radius) - 4px)",
+      },
+      keyframes: {
+        "accordion-down": {
+          from: { height: "0" },
+          to: { height: "var(--radix-accordion-content-height)" },
+        },
+        "accordion-up": {
+          from: { height: "var(--radix-accordion-content-height)" },
+          to: { height: "0" },
+        },
+        "fade-in": {
+          "0%": { opacity: "0" },
+          "100%": { opacity: "1" }
+        },
+        "fade-out": {
+          "0%": { opacity: "1" },
+          "100%": { opacity: "0" }
+        },
+        "slide-up": {
+          "0%": { transform: "translateY(10px)", opacity: "0" },
+          "100%": { transform: "translateY(0)", opacity: "1" }
+        },
+        "slide-down": {
+          "0%": { transform: "translateY(-10px)", opacity: "0" },
+          "100%": { transform: "translateY(0)", opacity: "1" }
+        },
+        "pulse": {
+          "0%, 100%": { opacity: "1" },
+          "50%": { opacity: "0.5" }
+        },
+        "float": {
+          "0%, 100%": { transform: "translateY(0)" },
+          "50%": { transform: "translateY(-10px)" }
+        },
+        "float-pulse": {
+          "0%": { transform: "translateY(0) scale(1)", opacity: "0.1" },
+          "50%": { transform: "translateY(-8px) scale(1.05)", opacity: "0.2" },
+          "100%": { transform: "translateY(0) scale(1)", opacity: "0.1" }
+        },
+        "glow": {
+          "0%, 100%": { boxShadow: "0 0 5px rgba(147, 51, 234, 0.3)" },
+          "50%": { boxShadow: "0 0 20px rgba(147, 51, 234, 0.6)" }
+        },
+        "rotate-slow": {
+          "0%": { transform: "rotate(0deg)" },
+          "100%": { transform: "rotate(360deg)" }
+        },
+        "shimmer": {
+          "0%": { backgroundPosition: "-200% 0" },
+          "100%": { backgroundPosition: "200% 0" }
+        }
+      },
+      animation: {
+        "accordion-down": "accordion-down 0.2s ease-out",
+        "accordion-up": "accordion-up 0.2s ease-out",
+        "fade-in": "fade-in 0.5s ease-out",
+        "fade-out": "fade-out 0.5s ease-out",
+        "slide-up": "slide-up 0.6s ease-out",
+        "slide-down": "slide-down 0.6s ease-out",
+        "pulse": "pulse 3s ease-in-out infinite",
+        "float": "float 6s ease-in-out infinite",
+        "float-pulse": "float-pulse 7s ease-in-out infinite",
+        "glow": "glow 2s ease-in-out infinite",
+        "rotate-slow": "rotate-slow 8s linear infinite",
+        "shimmer": "shimmer 3s linear infinite"
+      },
+    },
+  },
+  plugins: [require("tailwindcss-animate"), require("@tailwindcss/typography")],
+} satisfies Config
+export default config

tsconfig.json ADDED Viewed

	@@ -0,0 +1,27 @@

+{
+  "compilerOptions": {
+    "lib": ["dom", "dom.iterable", "esnext"],
+    "allowJs": true,
+    "target": "ES6",
+    "skipLibCheck": true,
+    "strict": true,
+    "noEmit": true,
+    "esModuleInterop": true,
+    "module": "esnext",
+    "moduleResolution": "bundler",
+    "resolveJsonModule": true,
+    "isolatedModules": true,
+    "jsx": "preserve",
+    "incremental": true,
+    "plugins": [
+      {
+        "name": "next"
+      }
+    ],
+    "paths": {
+      "@/*": ["./*"]
+    }
+  },
+  "include": ["next-env.d.ts", "**/*.ts", "**/*.tsx", ".next/types/**/*.ts"],
+  "exclude": ["node_modules"]
+}