JatinAutonomousLabs committed on
Commit
fd88fa8
·
verified ·
1 Parent(s): 5d37f3d

Update .env

Browse files
Files changed (1) hide show
  1. .env +13 -5
.env CHANGED
@@ -10,6 +10,7 @@
10
  # Get your API key from: https://novita.ai (never commit a real key to version control)
11
  NOVITA_API_KEY=sk_gaMaeJaUy-qQxms1NIgJuov_RotL_NZXMoQbJlNhS6M
12
 
 
13
  # Dedicated endpoint base URL (default for dedicated endpoints)
14
  NOVITA_BASE_URL=https://api.novita.ai/dedicated/v1/openai
15
 
@@ -31,19 +32,25 @@ DEEPSEEK_R1_FORCE_REASONING=True
31
  # Token Allocation Configuration
32
  # =============================================================================
33
  # Maximum tokens dedicated for user input (prioritized over context)
34
- # Recommended: 8000 tokens for large queries
35
- USER_INPUT_MAX_TOKENS=8000
36
 
37
  # Maximum tokens for context preparation (includes user input + context)
38
- # Recommended: 28000 tokens for 32K context window models
39
- CONTEXT_PREPARATION_BUDGET=28000
40
 
41
  # Context pruning threshold (should match CONTEXT_PREPARATION_BUDGET)
42
- CONTEXT_PRUNING_THRESHOLD=28000
43
 
44
  # Always prioritize user input over historical context
45
  PRIORITIZE_USER_INPUT=True
46
 
 
 
 
 
 
 
47
  # =============================================================================
48
  # Database Configuration
49
  # =============================================================================
@@ -161,3 +168,4 @@ CONTEXT_SYNTHESIS_MODEL=Qwen/Qwen2.5-7B-Instruct
161
  # - Use environment variables in production (not .env files)
162
  # - Set proper file permissions: chmod 600 .env
163
 
 
 
10
  # Get your API key from: https://novita.ai (never commit a real key to version control)
11
  NOVITA_API_KEY=sk_gaMaeJaUy-qQxms1NIgJuov_RotL_NZXMoQbJlNhS6M
12
 
13
+
14
  # Dedicated endpoint base URL (default for dedicated endpoints)
15
  NOVITA_BASE_URL=https://api.novita.ai/dedicated/v1/openai
16
 
 
32
  # Token Allocation Configuration
33
  # =============================================================================
34
  # Maximum tokens dedicated for user input (prioritized over context)
35
+ # Recommended: 32000 tokens for DeepSeek R1 (128K context window)
36
+ USER_INPUT_MAX_TOKENS=32000
37
 
38
  # Maximum tokens for context preparation (includes user input + context)
39
+ # Recommended: 115000 tokens for DeepSeek R1 (leaves ~13K for output)
40
+ CONTEXT_PREPARATION_BUDGET=115000
41
 
42
  # Context pruning threshold (should match CONTEXT_PREPARATION_BUDGET)
43
+ CONTEXT_PRUNING_THRESHOLD=115000
44
 
45
  # Always prioritize user input over historical context
46
  PRIORITIZE_USER_INPUT=True
47
 
48
+ # Model context window (actual limit for your deployed model)
49
+ # Default: 128000 tokens for DeepSeek R1 (128K context window)
50
+ # This is the maximum total number of tokens (input + output) the model can handle
51
+ # Take full advantage of DeepSeek R1's 128K capability
52
+ NOVITA_MODEL_CONTEXT_WINDOW=128000
53
+
54
  # =============================================================================
55
  # Database Configuration
56
  # =============================================================================
 
168
  # - Use environment variables in production (not .env files)
169
  # - Set proper file permissions: chmod 600 .env
170
 
171
+